diff --git a/2b855b4bc4opt2/3479854.err b/2b855b4bc4opt1/3479854.err similarity index 100% rename from 2b855b4bc4opt2/3479854.err rename to 2b855b4bc4opt1/3479854.err diff --git a/2b855b4bc4opt2/3479854.out b/2b855b4bc4opt1/3479854.out similarity index 100% rename from 2b855b4bc4opt2/3479854.out rename to 2b855b4bc4opt1/3479854.out diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt rename to 2b855b4bc4opt1/global_step70858/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_01-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_01-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_01-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_01-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_03-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_03-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_03-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_03-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_04-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_04-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_04-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_04-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_05-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_05-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_05-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_05-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_06-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_06-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_06-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_06-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_07-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_07-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_07-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_07-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_08-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_08-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_08-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_08-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_09-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_09-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_09-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_09-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_10-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_10-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_10-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_10-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_11-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_11-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_11-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_11-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_12-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_12-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_12-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_12-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_13-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_13-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_13-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_13-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_14-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_14-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_14-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_14-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_15-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_15-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_15-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_15-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_16-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_16-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_16-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_16-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_17-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_17-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_17-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_17-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_18-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_18-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_18-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_18-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_19-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_19-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_19-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_19-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_20-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_20-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_20-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_20-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_21-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_21-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_21-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_21-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_22-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_22-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_22-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_22-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_23-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_23-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_23-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_23-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_24-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_24-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_24-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_24-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_25-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_25-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_25-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_25-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_26-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_26-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_26-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_26-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_27-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_27-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_27-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_27-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_28-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_28-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_28-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_28-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_29-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_29-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_29-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_29-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_30-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_30-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_30-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_30-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_31-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_31-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_31-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_31-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_32-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_32-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_32-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_32-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_33-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_33-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_33-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_33-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_34-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_34-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_34-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_34-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/layer_36-model_00-model_states.pt b/2b855b4bc4opt1/global_step70858/layer_36-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/layer_36-model_00-model_states.pt rename to 2b855b4bc4opt1/global_step70858/layer_36-model_00-model_states.pt diff --git a/2b855b4bc4opt2/global_step70858/mp_rank_00_model_states.pt b/2b855b4bc4opt1/global_step70858/mp_rank_00_model_states.pt similarity index 100% rename from 2b855b4bc4opt2/global_step70858/mp_rank_00_model_states.pt rename to 2b855b4bc4opt1/global_step70858/mp_rank_00_model_states.pt diff --git a/2b855b4bc4opt1/latest b/2b855b4bc4opt1/latest new file mode 100644 index 0000000000000000000000000000000000000000..dd4ed4f46fbdfdfeade5c057e176c669f8c232fa --- /dev/null +++ b/2b855b4bc4opt1/latest @@ -0,0 +1 @@ +global_step70858 \ No newline at end of file diff --git a/2b855b4bc4opt2/sbatch_2b855b4bc4opt2.sh b/2b855b4bc4opt1/sbatch_2b855b4bc4opt2.sh similarity index 100% rename from 2b855b4bc4opt2/sbatch_2b855b4bc4opt2.sh rename to 2b855b4bc4opt1/sbatch_2b855b4bc4opt2.sh diff --git a/2b855b4bc4opt2/sbatch_2b855b4bc4opt2val.sh b/2b855b4bc4opt1/sbatch_2b855b4bc4opt2val.sh similarity index 100% rename from 2b855b4bc4opt2/sbatch_2b855b4bc4opt2val.sh rename to 2b855b4bc4opt1/sbatch_2b855b4bc4opt2val.sh diff --git a/2b855b4bc4opt2/tensorboard_2b855b4bc4opt2/events.out.tfevents.1683359704.nid007164.87766.0 b/2b855b4bc4opt1/tensorboard_2b855b4bc4opt2/events.out.tfevents.1683359704.nid007164.87766.0 similarity index 100% rename from 2b855b4bc4opt2/tensorboard_2b855b4bc4opt2/events.out.tfevents.1683359704.nid007164.87766.0 rename to 2b855b4bc4opt1/tensorboard_2b855b4bc4opt2/events.out.tfevents.1683359704.nid007164.87766.0 diff --git a/2b855b4bc4opt2/tensorboard_2b855b4bc4opt2/events.out.tfevents.1683466010.nid006323.40463.0 b/2b855b4bc4opt1/tensorboard_2b855b4bc4opt2/events.out.tfevents.1683466010.nid006323.40463.0 similarity index 100% rename from 2b855b4bc4opt2/tensorboard_2b855b4bc4opt2/events.out.tfevents.1683466010.nid006323.40463.0 rename to 2b855b4bc4opt1/tensorboard_2b855b4bc4opt2/events.out.tfevents.1683466010.nid006323.40463.0 diff --git a/2b855b4bc4opt2/tensorboard_2b855b4bc4opt2/events.out.tfevents.1683466819.nid006037.107824.0 b/2b855b4bc4opt1/tensorboard_2b855b4bc4opt2/events.out.tfevents.1683466819.nid006037.107824.0 similarity index 100% rename from 2b855b4bc4opt2/tensorboard_2b855b4bc4opt2/events.out.tfevents.1683466819.nid006037.107824.0 rename to 2b855b4bc4opt1/tensorboard_2b855b4bc4opt2/events.out.tfevents.1683466819.nid006037.107824.0 diff --git a/2b855b4bc4opt2/tensorboard_2b855b4bc4opt2val/events.out.tfevents.1683533643.nid005517.37748.0 b/2b855b4bc4opt1/tensorboard_2b855b4bc4opt2val/events.out.tfevents.1683533643.nid005517.37748.0 similarity index 100% rename from 2b855b4bc4opt2/tensorboard_2b855b4bc4opt2val/events.out.tfevents.1683533643.nid005517.37748.0 rename to 2b855b4bc4opt1/tensorboard_2b855b4bc4opt2val/events.out.tfevents.1683533643.nid005517.37748.0 diff --git a/2b855b4bc4opt2/tensorboard_2b855b4bc4opt2val/events.out.tfevents.1683564137.nid006565.42760.0 b/2b855b4bc4opt1/tensorboard_2b855b4bc4opt2val/events.out.tfevents.1683564137.nid006565.42760.0 similarity index 100% rename from 2b855b4bc4opt2/tensorboard_2b855b4bc4opt2val/events.out.tfevents.1683564137.nid006565.42760.0 rename to 2b855b4bc4opt1/tensorboard_2b855b4bc4opt2val/events.out.tfevents.1683564137.nid006565.42760.0 diff --git a/2b855b4bc4opt2/3509629.err b/2b855b4bc4opt2/3509629.err new file mode 100644 index 0000000000000000000000000000000000000000..6a79cb259ad5c28bd54a524210f6220967917a42 --- /dev/null +++ b/2b855b4bc4opt2/3509629.err @@ -0,0 +1,3625 @@ +29: 2023-05-13 00:56:48.846418: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +29: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +29: 2023-05-13 00:56:48.846421: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +29: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +29: 2023-05-13 00:56:48.846431: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +14: 2023-05-13 00:56:48.846407: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +14: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +14: 2023-05-13 00:56:48.846417: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +14: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +14: 2023-05-13 00:56:48.846420: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +29: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +29: 2023-05-13 00:56:48.846437: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +29: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +29: 2023-05-13 00:56:48.846441: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +29: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +14: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +14: 2023-05-13 00:56:48.846423: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +14: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +14: 2023-05-13 00:56:48.846427: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +14: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +21: 2023-05-13 00:56:48.846500: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +21: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +21: 2023-05-13 00:56:48.846511: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +21: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +21: 2023-05-13 00:56:48.846507: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +29: 2023-05-13 00:56:48.846443: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +29: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +29: 2023-05-13 00:56:48.846437: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +29: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +29: 2023-05-13 00:56:48.846452: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +14: 2023-05-13 00:56:48.846407: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +14: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +14: 2023-05-13 00:56:48.846414: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +14: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +14: 2023-05-13 00:56:48.846435: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +21: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +21: 2023-05-13 00:56:48.846510: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +21: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +21: 2023-05-13 00:56:48.846510: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +21: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +29: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +14: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +21: 2023-05-13 00:56:48.846500: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +21: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +21: 2023-05-13 00:56:48.846519: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +21: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +21: 2023-05-13 00:56:48.846499: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 1: 2023-05-13 00:56:48.846768: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 1: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 1: 2023-05-13 00:56:48.846781: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 1: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 1: 2023-05-13 00:56:48.846783: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +21: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +30: 2023-05-13 00:56:48.846806: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +30: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +30: 2023-05-13 00:56:48.846811: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +30: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +30: 2023-05-13 00:56:48.846818: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 0: 2023-05-13 00:56:48.846752: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 0: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 0: 2023-05-13 00:56:48.846768: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 0: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 0: 2023-05-13 00:56:48.846772: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 2: 2023-05-13 00:56:48.846833: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 2: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 2: 2023-05-13 00:56:48.846828: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 2: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 2: 2023-05-13 00:56:48.846835: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 1: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 1: 2023-05-13 00:56:48.846775: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 1: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 1: 2023-05-13 00:56:48.846775: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 1: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +30: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +30: 2023-05-13 00:56:48.846822: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +30: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +30: 2023-05-13 00:56:48.846827: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +30: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 0: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 0: 2023-05-13 00:56:48.846763: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 0: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 0: 2023-05-13 00:56:48.846759: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 0: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 2: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 2: 2023-05-13 00:56:48.846831: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 2: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 2: 2023-05-13 00:56:48.846843: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 2: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 1: 2023-05-13 00:56:48.846772: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 1: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 1: 2023-05-13 00:56:48.846772: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 1: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 1: 2023-05-13 00:56:48.846770: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +30: 2023-05-13 00:56:48.846829: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +30: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +30: 2023-05-13 00:56:48.846815: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +30: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +30: 2023-05-13 00:56:48.846815: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 0: 2023-05-13 00:56:48.846773: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 0: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 0: 2023-05-13 00:56:48.846752: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 0: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 0: 2023-05-13 00:56:48.846755: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 2: 2023-05-13 00:56:48.846823: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 2: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 2: 2023-05-13 00:56:48.846836: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 2: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 2: 2023-05-13 00:56:48.846838: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 1: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +30: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 0: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 2: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 4: 2023-05-13 00:56:48.847726: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 4: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 4: 2023-05-13 00:56:48.847735: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 4: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 4: 2023-05-13 00:56:48.847737: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 4: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 4: 2023-05-13 00:56:48.847734: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 4: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 4: 2023-05-13 00:56:48.847722: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 4: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 4: 2023-05-13 00:56:48.847728: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 4: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 4: 2023-05-13 00:56:48.847722: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 4: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 4: 2023-05-13 00:56:48.847734: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 4: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +31: 2023-05-13 00:56:48.848316: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +31: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +31: 2023-05-13 00:56:48.848334: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +31: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +31: 2023-05-13 00:56:48.848327: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +31: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +31: 2023-05-13 00:56:48.848324: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +31: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +31: 2023-05-13 00:56:48.848319: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +31: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +31: 2023-05-13 00:56:48.848316: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +31: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +31: 2023-05-13 00:56:48.848326: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +31: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +31: 2023-05-13 00:56:48.848316: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +31: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 5: 2023-05-13 00:56:48.916446: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 5: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 5: 2023-05-13 00:56:48.916461: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 5: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 5: 2023-05-13 00:56:48.916454: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 5: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 5: 2023-05-13 00:56:48.916469: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 5: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 5: 2023-05-13 00:56:48.916479: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 5: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 5: 2023-05-13 00:56:48.916476: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 5: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 5: 2023-05-13 00:56:48.916482: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 5: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 5: 2023-05-13 00:56:48.916486: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 5: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +15: 2023-05-13 00:56:48.917098: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +15: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +15: 2023-05-13 00:56:48.917104: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +15: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +15: 2023-05-13 00:56:48.917097: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +15: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +15: 2023-05-13 00:56:48.917100: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +15: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +15: 2023-05-13 00:56:48.917106: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +15: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +15: 2023-05-13 00:56:48.917091: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +15: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +15: 2023-05-13 00:56:48.917091: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +15: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +15: 2023-05-13 00:56:48.917099: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +15: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +17: 2023-05-13 00:56:48.918312: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +17: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +17: 2023-05-13 00:56:48.918321: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +17: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +17: 2023-05-13 00:56:48.918324: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +17: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +17: 2023-05-13 00:56:48.918325: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +17: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +17: 2023-05-13 00:56:48.918329: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +17: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +17: 2023-05-13 00:56:48.918330: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +17: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +17: 2023-05-13 00:56:48.918309: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +17: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +17: 2023-05-13 00:56:48.918337: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +17: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +25: 2023-05-13 00:56:48.926903: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +25: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +25: 2023-05-13 00:56:48.926911: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +25: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +25: 2023-05-13 00:56:48.926912: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +25: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +25: 2023-05-13 00:56:48.926916: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +25: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +25: 2023-05-13 00:56:48.926913: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +25: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +22: 2023-05-13 00:56:48.926922: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +22: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +22: 2023-05-13 00:56:48.926930: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +22: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +22: 2023-05-13 00:56:48.926928: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +25: 2023-05-13 00:56:48.926917: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +25: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +25: 2023-05-13 00:56:48.926919: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +25: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +25: 2023-05-13 00:56:48.926915: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +22: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +22: 2023-05-13 00:56:48.926916: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +22: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +22: 2023-05-13 00:56:48.926936: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +22: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +25: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +22: 2023-05-13 00:56:48.926946: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +22: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +22: 2023-05-13 00:56:48.926940: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +22: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +22: 2023-05-13 00:56:48.926960: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +22: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +26: 2023-05-13 00:56:49.004640: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +26: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +26: 2023-05-13 00:56:49.004647: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +26: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +26: 2023-05-13 00:56:49.004647: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +20: 2023-05-13 00:56:49.004812: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +20: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +20: 2023-05-13 00:56:49.004818: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +20: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +20: 2023-05-13 00:56:49.004820: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +20: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +20: 2023-05-13 00:56:49.004823: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +20: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +20: 2023-05-13 00:56:49.004825: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +20: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +26: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +26: 2023-05-13 00:56:49.004641: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +26: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +26: 2023-05-13 00:56:49.004634: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +26: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +20: 2023-05-13 00:56:49.004825: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +20: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +20: 2023-05-13 00:56:49.004829: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +20: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +20: 2023-05-13 00:56:49.004834: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +26: 2023-05-13 00:56:49.004636: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +26: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +26: 2023-05-13 00:56:49.004634: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +26: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +26: 2023-05-13 00:56:49.004655: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +20: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +26: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 3: 2023-05-13 00:56:49.073859: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 3: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 3: 2023-05-13 00:56:49.073871: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 3: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 3: 2023-05-13 00:56:49.073863: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 3: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 3: 2023-05-13 00:56:49.073865: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 3: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 3: 2023-05-13 00:56:49.073859: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 3: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 3: 2023-05-13 00:56:49.073865: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 3: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 3: 2023-05-13 00:56:49.073870: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 3: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 3: 2023-05-13 00:56:49.073867: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 3: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +19: 2023-05-13 00:56:49.077786: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +19: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +19: 2023-05-13 00:56:49.077789: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +19: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +19: 2023-05-13 00:56:49.077788: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +19: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +19: 2023-05-13 00:56:49.077777: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +19: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +19: 2023-05-13 00:56:49.077794: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +19: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +19: 2023-05-13 00:56:49.077784: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +19: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +19: 2023-05-13 00:56:49.077796: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +19: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +19: 2023-05-13 00:56:49.077777: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +19: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +24: 2023-05-13 00:56:49.079508: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +24: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +24: 2023-05-13 00:56:49.079524: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +24: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +24: 2023-05-13 00:56:49.079532: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +24: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +24: 2023-05-13 00:56:49.079532: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +24: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +24: 2023-05-13 00:56:49.079534: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +24: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +24: 2023-05-13 00:56:49.079538: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +24: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +24: 2023-05-13 00:56:49.079541: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +24: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +24: 2023-05-13 00:56:49.079545: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +24: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 8: 2023-05-13 00:56:49.095401: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 8: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 8: 2023-05-13 00:56:49.095388: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 8: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 8: 2023-05-13 00:56:49.095401: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +23: 2023-05-13 00:56:49.095389: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +23: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +23: 2023-05-13 00:56:49.095390: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +23: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +23: 2023-05-13 00:56:49.095422: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 8: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 8: 2023-05-13 00:56:49.095402: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 8: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 8: 2023-05-13 00:56:49.095404: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 8: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +23: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +23: 2023-05-13 00:56:49.095425: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +23: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +23: 2023-05-13 00:56:49.095432: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +23: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 8: 2023-05-13 00:56:49.095390: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 8: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 8: 2023-05-13 00:56:49.095403: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 8: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 8: 2023-05-13 00:56:49.095389: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +23: 2023-05-13 00:56:49.095416: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +23: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +23: 2023-05-13 00:56:49.095433: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +23: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +23: 2023-05-13 00:56:49.095419: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 8: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +23: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 9: 2023-05-13 00:56:49.095867: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 9: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 9: 2023-05-13 00:56:49.095854: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 9: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 9: 2023-05-13 00:56:49.095868: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 9: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 9: 2023-05-13 00:56:49.095870: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 9: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 9: 2023-05-13 00:56:49.095856: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 9: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 9: 2023-05-13 00:56:49.095879: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 9: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 9: 2023-05-13 00:56:49.095881: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 9: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 9: 2023-05-13 00:56:49.095855: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 9: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +10: 2023-05-13 00:56:49.250140: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +10: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +10: 2023-05-13 00:56:49.250145: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +10: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +10: 2023-05-13 00:56:49.250158: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +12: 2023-05-13 00:56:49.250212: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +12: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +12: 2023-05-13 00:56:49.250224: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +12: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +12: 2023-05-13 00:56:49.250218: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +10: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +10: 2023-05-13 00:56:49.250158: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +10: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +10: 2023-05-13 00:56:49.250141: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +10: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +12: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +12: 2023-05-13 00:56:49.250232: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +12: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +12: 2023-05-13 00:56:49.250236: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +12: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +10: 2023-05-13 00:56:49.250169: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +10: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +10: 2023-05-13 00:56:49.250159: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +10: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +10: 2023-05-13 00:56:49.250149: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +12: 2023-05-13 00:56:49.250226: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +12: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +12: 2023-05-13 00:56:49.250243: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +12: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +12: 2023-05-13 00:56:49.250250: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +10: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +12: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 7: 2023-05-13 00:56:49.250742: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 7: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 7: 2023-05-13 00:56:49.250756: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 7: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 7: 2023-05-13 00:56:49.250756: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 7: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 7: 2023-05-13 00:56:49.250755: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 7: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 7: 2023-05-13 00:56:49.250757: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 7: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 7: 2023-05-13 00:56:49.250765: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 7: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 7: 2023-05-13 00:56:49.250748: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 7: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 7: 2023-05-13 00:56:49.250748: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +18: 2023-05-13 00:56:49.250996: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +18: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +18: 2023-05-13 00:56:49.251002: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +18: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +18: 2023-05-13 00:56:49.250994: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +16: 2023-05-13 00:56:49.250460: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +16: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +16: 2023-05-13 00:56:49.250478: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +16: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +16: 2023-05-13 00:56:49.250465: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 7: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +18: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +18: 2023-05-13 00:56:49.250992: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +18: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +18: 2023-05-13 00:56:49.251004: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +18: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +16: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +16: 2023-05-13 00:56:49.250463: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +16: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +16: 2023-05-13 00:56:49.250459: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +16: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +18: 2023-05-13 00:56:49.251005: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +18: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +18: 2023-05-13 00:56:49.251007: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +18: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +18: 2023-05-13 00:56:49.251004: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +16: 2023-05-13 00:56:49.250456: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +16: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +16: 2023-05-13 00:56:49.250467: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +16: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +16: 2023-05-13 00:56:49.250468: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +18: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +16: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +27: 2023-05-13 00:56:49.251407: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +27: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +27: 2023-05-13 00:56:49.251412: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +27: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +27: 2023-05-13 00:56:49.251416: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +27: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +27: 2023-05-13 00:56:49.251416: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +27: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +27: 2023-05-13 00:56:49.251421: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +27: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +27: 2023-05-13 00:56:49.251419: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +27: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +27: 2023-05-13 00:56:49.251427: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +27: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +27: 2023-05-13 00:56:49.251416: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +27: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +11: 2023-05-13 00:56:49.252027: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +11: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +11: 2023-05-13 00:56:49.252035: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +11: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +11: 2023-05-13 00:56:49.252037: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +11: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +11: 2023-05-13 00:56:49.252038: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +11: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +11: 2023-05-13 00:56:49.252040: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +11: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +11: 2023-05-13 00:56:49.252022: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +11: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +11: 2023-05-13 00:56:49.252037: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +11: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +11: 2023-05-13 00:56:49.252029: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +11: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 6: 2023-05-13 00:56:49.329999: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 6: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 6: 2023-05-13 00:56:49.330011: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 6: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 6: 2023-05-13 00:56:49.330008: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 6: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 6: 2023-05-13 00:56:49.330009: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 6: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 6: 2023-05-13 00:56:49.330003: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 6: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 6: 2023-05-13 00:56:49.330000: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 6: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 6: 2023-05-13 00:56:49.329999: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 6: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. + 6: 2023-05-13 00:56:49.330014: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA + 6: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +28: 2023-05-13 00:56:49.619673: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +28: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +28: 2023-05-13 00:56:49.619668: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +28: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +28: 2023-05-13 00:56:49.619666: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +28: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +28: 2023-05-13 00:56:49.619676: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +28: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +28: 2023-05-13 00:56:49.619686: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +28: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +28: 2023-05-13 00:56:49.619686: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +28: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +28: 2023-05-13 00:56:49.619688: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +28: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +28: 2023-05-13 00:56:49.619676: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +28: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +13: 2023-05-13 00:56:49.619988: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +13: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +13: 2023-05-13 00:56:49.619993: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +13: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +13: 2023-05-13 00:56:49.619993: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +13: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +13: 2023-05-13 00:56:49.619995: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +13: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +13: 2023-05-13 00:56:49.619992: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +13: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +13: 2023-05-13 00:56:49.620000: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +13: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +13: 2023-05-13 00:56:49.619990: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +13: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +13: 2023-05-13 00:56:49.619990: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA +13: To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags. +12: 2023-05-13 00:56:58.800054: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:56:58.800130: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:56:58.800075: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:56:58.800181: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:56:58.800097: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:56:58.800190: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:56:58.800109: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:56:58.800217: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:56:58.800119: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:56:58.800228: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:56:58.800140: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:56:58.800227: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:56:58.800130: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:56:58.800233: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:56:58.800105: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:56:58.800257: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:56:58.800821: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +12: 2023-05-13 00:56:58.800838: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +22: 2023-05-13 00:56:58.800903: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +31: 2023-05-13 00:56:58.800459: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:56:58.800851: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +12: 2023-05-13 00:56:58.800859: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +12: 2023-05-13 00:56:58.800867: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +31: 2023-05-13 00:56:58.800489: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:56:58.800865: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +12: 2023-05-13 00:56:58.800874: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +22: 2023-05-13 00:56:58.800925: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +22: 2023-05-13 00:56:58.800931: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +31: 2023-05-13 00:56:58.800507: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:56:58.800888: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +22: 2023-05-13 00:56:58.800944: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +31: 2023-05-13 00:56:58.800573: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:56:58.800583: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:56:58.800954: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +31: 2023-05-13 00:56:58.800591: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:56:58.800965: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +31: 2023-05-13 00:56:58.800604: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:56:58.800651: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:56:58.800979: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +22: 2023-05-13 00:56:58.800978: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +31: 2023-05-13 00:56:58.800626: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:56:58.800628: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:56:58.800608: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +19: 2023-05-13 00:56:58.800464: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:56:58.800671: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +19: 2023-05-13 00:56:58.800504: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:56:58.800991: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:56:58.800603: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:56:58.800692: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:56:58.801314: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +19: 2023-05-13 00:56:58.800514: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:56:58.800650: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:56:58.800724: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +19: 2023-05-13 00:56:58.800560: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:56:58.801008: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:56:58.800629: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:56:58.800715: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:56:58.800846: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:56:58.801338: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +19: 2023-05-13 00:56:58.800573: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:56:58.801031: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:56:58.800669: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:56:58.800744: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:56:58.800911: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:56:58.801352: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +31: 2023-05-13 00:56:58.801363: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +19: 2023-05-13 00:56:58.800573: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:56:58.801046: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:56:58.800667: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:56:58.801340: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 7: 2023-05-13 00:56:58.801360: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +15: 2023-05-13 00:56:58.800904: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:56:58.801376: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +19: 2023-05-13 00:56:58.800588: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:56:58.801047: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:56:58.800709: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:56:58.801377: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +15: 2023-05-13 00:56:58.800919: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:56:58.801388: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +19: 2023-05-13 00:56:58.800588: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:56:58.801061: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:56:58.800696: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:56:58.801389: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 7: 2023-05-13 00:56:58.801399: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 7: 2023-05-13 00:56:58.801405: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +15: 2023-05-13 00:56:58.800940: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:56:58.801398: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +19: 2023-05-13 00:56:58.801223: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +19: 2023-05-13 00:56:58.801243: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +25: 2023-05-13 00:56:58.801053: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:56:58.800724: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:56:58.801416: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 7: 2023-05-13 00:56:58.801415: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +15: 2023-05-13 00:56:58.800962: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:56:58.801406: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +19: 2023-05-13 00:56:58.801254: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +25: 2023-05-13 00:56:58.801070: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:56:58.801410: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +27: 2023-05-13 00:56:58.801422: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +15: 2023-05-13 00:56:58.800969: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +19: 2023-05-13 00:56:58.801275: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +19: 2023-05-13 00:56:58.801287: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +25: 2023-05-13 00:56:58.801622: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +25: 2023-05-13 00:56:58.801642: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +27: 2023-05-13 00:56:58.801435: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +15: 2023-05-13 00:56:58.800979: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +19: 2023-05-13 00:56:58.801297: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +25: 2023-05-13 00:56:58.801656: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +15: 2023-05-13 00:56:58.801509: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +24: 2023-05-13 00:56:58.801186: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +19: 2023-05-13 00:56:58.801298: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +14: 2023-05-13 00:56:58.801136: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:56:58.801683: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +27: 2023-05-13 00:56:58.801475: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +27: 2023-05-13 00:56:58.801487: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +27: 2023-05-13 00:56:58.801494: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +15: 2023-05-13 00:56:58.801531: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +24: 2023-05-13 00:56:58.801240: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +19: 2023-05-13 00:56:58.801306: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +16: 2023-05-13 00:56:58.800860: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:56:58.801172: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:56:58.801690: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +25: 2023-05-13 00:56:58.801692: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +27: 2023-05-13 00:56:58.801509: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 2: 2023-05-13 00:56:58.801159: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:56:58.801241: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:56:58.800897: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:56:58.801210: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:56:58.801705: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +27: 2023-05-13 00:56:58.801511: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +20: 2023-05-13 00:56:58.801387: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:56:58.801543: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +15: 2023-05-13 00:56:58.801549: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +24: 2023-05-13 00:56:58.801275: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:56:58.800907: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:56:58.801244: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:56:58.801709: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +20: 2023-05-13 00:56:58.801414: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 3: 2023-05-13 00:56:58.801179: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:56:58.801191: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:56:58.801563: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +24: 2023-05-13 00:56:58.801298: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:56:58.800914: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:56:58.801259: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:56:58.801440: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 3: 2023-05-13 00:56:58.801212: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:56:58.801208: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:56:58.801321: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:56:58.801573: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +24: 2023-05-13 00:56:58.801291: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:56:58.800923: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:56:58.801265: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:56:58.801445: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 3: 2023-05-13 00:56:58.801244: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:56:58.801235: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:56:58.801585: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +24: 2023-05-13 00:56:58.801295: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:56:58.800894: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:56:58.801280: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:56:58.801461: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 3: 2023-05-13 00:56:58.801266: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:56:58.801253: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:56:58.801362: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:56:58.801591: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +24: 2023-05-13 00:56:58.801340: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:56:58.800927: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:56:58.801294: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:56:58.801481: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 3: 2023-05-13 00:56:58.801282: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:56:58.801260: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:56:58.801413: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:56:58.801894: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +24: 2023-05-13 00:56:58.801898: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +16: 2023-05-13 00:56:58.801022: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:56:58.802026: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +14: 2023-05-13 00:56:58.802042: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +20: 2023-05-13 00:56:58.801460: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 3: 2023-05-13 00:56:58.801288: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:56:58.801290: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:56:58.801461: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:56:58.801901: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +16: 2023-05-13 00:56:58.801547: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +14: 2023-05-13 00:56:58.802056: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +14: 2023-05-13 00:56:58.802065: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +14: 2023-05-13 00:56:58.802070: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +14: 2023-05-13 00:56:58.802072: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +20: 2023-05-13 00:56:58.801491: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 3: 2023-05-13 00:56:58.801310: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:56:58.801264: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:56:58.801390: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:56:58.801905: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +24: 2023-05-13 00:56:58.801910: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +24: 2023-05-13 00:56:58.801912: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +24: 2023-05-13 00:56:58.801916: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +14: 2023-05-13 00:56:58.802079: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +14: 2023-05-13 00:56:58.802089: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 3: 2023-05-13 00:56:58.801301: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:56:58.801501: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:56:58.801920: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 3: 2023-05-13 00:56:58.802064: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 1: 2023-05-13 00:56:58.801466: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:56:58.801567: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +20: 2023-05-13 00:56:58.802311: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +20: 2023-05-13 00:56:58.802330: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 3: 2023-05-13 00:56:58.802084: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 1: 2023-05-13 00:56:58.801475: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:56:58.801590: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 3: 2023-05-13 00:56:58.802091: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 3: 2023-05-13 00:56:58.802094: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +16: 2023-05-13 00:56:58.801602: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +16: 2023-05-13 00:56:58.801603: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +16: 2023-05-13 00:56:58.801601: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +20: 2023-05-13 00:56:58.802343: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +16: 2023-05-13 00:56:58.801616: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +16: 2023-05-13 00:56:58.801618: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +20: 2023-05-13 00:56:58.802354: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +20: 2023-05-13 00:56:58.802358: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +20: 2023-05-13 00:56:58.802376: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +20: 2023-05-13 00:56:58.802372: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +20: 2023-05-13 00:56:58.802386: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 3: 2023-05-13 00:56:58.802115: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 3: 2023-05-13 00:56:58.802118: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 2: 2023-05-13 00:56:58.802131: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 2: 2023-05-13 00:56:58.802151: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 3: 2023-05-13 00:56:58.802128: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 1: 2023-05-13 00:56:58.802181: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 3: 2023-05-13 00:56:58.802145: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 2: 2023-05-13 00:56:58.802164: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 2: 2023-05-13 00:56:58.802182: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 2: 2023-05-13 00:56:58.802192: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 2: 2023-05-13 00:56:58.802195: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 2: 2023-05-13 00:56:58.802203: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 1: 2023-05-13 00:56:58.802198: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 2: 2023-05-13 00:56:58.802208: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 1: 2023-05-13 00:56:58.802216: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 1: 2023-05-13 00:56:58.802230: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 1: 2023-05-13 00:56:58.802238: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 1: 2023-05-13 00:56:58.802242: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 1: 2023-05-13 00:56:58.802254: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 1: 2023-05-13 00:56:58.802267: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +13: 2023-05-13 00:56:58.802040: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:56:58.802076: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:56:58.802096: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:56:58.802143: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:56:58.802113: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:56:58.802143: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:56:58.802055: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:56:58.802162: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:56:58.802146: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:56:58.802098: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:56:58.802145: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:56:58.802168: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:56:58.802115: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:56:58.802180: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:56:58.802720: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +13: 2023-05-13 00:56:58.802739: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +26: 2023-05-13 00:56:58.802182: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:56:58.802203: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:56:58.802750: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +13: 2023-05-13 00:56:58.802763: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +13: 2023-05-13 00:56:58.802771: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +13: 2023-05-13 00:56:58.802775: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +13: 2023-05-13 00:56:58.802770: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +13: 2023-05-13 00:56:58.802788: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +23: 2023-05-13 00:56:58.802511: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:56:58.802882: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +26: 2023-05-13 00:56:58.802902: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +26: 2023-05-13 00:56:58.802926: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +23: 2023-05-13 00:56:58.802527: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:56:58.802545: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:56:58.802553: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:56:58.802940: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +23: 2023-05-13 00:56:58.802560: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:56:58.802964: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +26: 2023-05-13 00:56:58.802971: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +23: 2023-05-13 00:56:58.802563: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:56:58.802982: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +23: 2023-05-13 00:56:58.802577: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:56:58.802572: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:56:58.802649: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:56:58.802482: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:56:58.802986: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +23: 2023-05-13 00:56:58.803066: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +21: 2023-05-13 00:56:58.802673: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:56:58.802501: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:56:58.803083: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +21: 2023-05-13 00:56:58.802679: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:56:58.802509: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:56:58.802696: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:56:58.802522: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:56:58.803099: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +23: 2023-05-13 00:56:58.803108: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +21: 2023-05-13 00:56:58.802709: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:56:58.802530: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:56:58.803120: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +21: 2023-05-13 00:56:58.802717: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:56:58.802635: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:56:58.802541: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:56:58.802736: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:56:58.802538: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:56:58.803136: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +23: 2023-05-13 00:56:58.803140: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +21: 2023-05-13 00:56:58.802726: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:56:58.802534: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:56:58.803148: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +21: 2023-05-13 00:56:58.803228: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +30: 2023-05-13 00:56:58.802651: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:56:58.803108: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +21: 2023-05-13 00:56:58.803247: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +30: 2023-05-13 00:56:58.802661: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:56:58.802673: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:56:58.802681: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:56:58.803263: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +30: 2023-05-13 00:56:58.802684: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:56:58.803274: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +30: 2023-05-13 00:56:58.802697: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:56:58.803283: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +30: 2023-05-13 00:56:58.802689: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:56:58.803128: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +28: 2023-05-13 00:56:58.803136: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +28: 2023-05-13 00:56:58.803147: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +28: 2023-05-13 00:56:58.803155: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +28: 2023-05-13 00:56:58.803164: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +21: 2023-05-13 00:56:58.803294: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +21: 2023-05-13 00:56:58.803297: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +21: 2023-05-13 00:56:58.803300: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 5: 2023-05-13 00:56:58.802769: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:56:58.802768: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:56:58.803168: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +28: 2023-05-13 00:56:58.803173: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 8: 2023-05-13 00:56:58.802788: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:56:58.802802: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:56:58.802819: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:56:58.802785: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:56:58.802829: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:56:58.802795: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:56:58.803318: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +30: 2023-05-13 00:56:58.803334: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 8: 2023-05-13 00:56:58.802825: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:56:58.802811: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:56:58.802846: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:56:58.802816: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:56:58.803345: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 8: 2023-05-13 00:56:58.802852: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:56:58.802830: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:56:58.803362: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +30: 2023-05-13 00:56:58.803365: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +30: 2023-05-13 00:56:58.803370: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +30: 2023-05-13 00:56:58.803375: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 5: 2023-05-13 00:56:58.802830: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:56:58.802822: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:56:58.803380: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 5: 2023-05-13 00:56:58.803430: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 5: 2023-05-13 00:56:58.803447: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 5: 2023-05-13 00:56:58.803457: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 5: 2023-05-13 00:56:58.803471: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 5: 2023-05-13 00:56:58.803477: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 5: 2023-05-13 00:56:58.803479: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 5: 2023-05-13 00:56:58.803491: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 5: 2023-05-13 00:56:58.803506: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 8: 2023-05-13 00:56:58.803629: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +11: 2023-05-13 00:56:58.802693: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:56:58.802819: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:56:58.803650: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 8: 2023-05-13 00:56:58.803662: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 0: 2023-05-13 00:56:58.802840: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:56:58.802722: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:56:58.802851: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:56:58.802738: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:56:58.802881: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:56:58.802888: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:56:58.803682: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +11: 2023-05-13 00:56:58.802742: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:56:58.802843: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:56:58.802918: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:56:58.803690: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 8: 2023-05-13 00:56:58.803691: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +11: 2023-05-13 00:56:58.802749: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:56:58.803702: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +11: 2023-05-13 00:56:58.802770: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:56:58.802905: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:56:58.803068: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:56:58.803059: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:56:58.803707: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +11: 2023-05-13 00:56:58.802760: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:56:58.802913: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:56:58.802865: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:56:58.802785: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:56:58.802928: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:56:58.802875: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:56:58.803091: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:56:58.803089: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:56:58.802936: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:56:58.802902: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:56:58.803106: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:56:58.803079: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:56:58.802938: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:56:58.802914: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:56:58.803117: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:56:58.803115: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:56:58.802959: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:56:58.802910: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:56:58.803131: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:56:58.803130: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:56:58.802952: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:56:58.802928: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:56:58.803139: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:56:58.803121: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:56:58.802914: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:56:58.803151: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:56:58.803144: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:56:58.803194: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 6: 2023-05-13 00:56:58.803074: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:56:58.803142: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:56:58.803131: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:56:58.803845: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 6: 2023-05-13 00:56:58.803093: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:56:58.803214: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 6: 2023-05-13 00:56:58.803105: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:56:58.803869: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +11: 2023-05-13 00:56:58.803879: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +18: 2023-05-13 00:56:58.803540: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:56:58.803225: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 6: 2023-05-13 00:56:58.803121: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:56:58.803900: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +29: 2023-05-13 00:56:58.803242: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 6: 2023-05-13 00:56:58.803129: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +18: 2023-05-13 00:56:58.803553: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:56:58.803251: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 6: 2023-05-13 00:56:58.803132: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +18: 2023-05-13 00:56:58.803565: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:56:58.803261: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 6: 2023-05-13 00:56:58.803149: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:56:58.803910: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +11: 2023-05-13 00:56:58.803917: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +11: 2023-05-13 00:56:58.803924: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +18: 2023-05-13 00:56:58.803574: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:56:58.803266: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 6: 2023-05-13 00:56:58.803139: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:56:58.803938: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +18: 2023-05-13 00:56:58.803581: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:56:58.803248: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +18: 2023-05-13 00:56:58.803578: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +18: 2023-05-13 00:56:58.803589: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +18: 2023-05-13 00:56:58.803593: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:56:58.804171: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +10: 2023-05-13 00:56:58.804193: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 9: 2023-05-13 00:56:58.804123: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 9: 2023-05-13 00:56:58.804145: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +17: 2023-05-13 00:56:58.804308: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +17: 2023-05-13 00:56:58.804330: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +10: 2023-05-13 00:56:58.804203: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 4: 2023-05-13 00:56:58.804323: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 4: 2023-05-13 00:56:58.804344: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +10: 2023-05-13 00:56:58.804222: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +10: 2023-05-13 00:56:58.804229: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +10: 2023-05-13 00:56:58.804237: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +10: 2023-05-13 00:56:58.804246: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +10: 2023-05-13 00:56:58.804247: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +17: 2023-05-13 00:56:58.804340: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 9: 2023-05-13 00:56:58.804155: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +17: 2023-05-13 00:56:58.804368: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 4: 2023-05-13 00:56:58.804370: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 9: 2023-05-13 00:56:58.804188: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 9: 2023-05-13 00:56:58.804187: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +17: 2023-05-13 00:56:58.804379: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +17: 2023-05-13 00:56:58.804378: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 9: 2023-05-13 00:56:58.804208: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 9: 2023-05-13 00:56:58.804208: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 9: 2023-05-13 00:56:58.804211: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 4: 2023-05-13 00:56:58.804380: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 4: 2023-05-13 00:56:58.804401: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 4: 2023-05-13 00:56:58.804399: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 4: 2023-05-13 00:56:58.804414: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +29: 2023-05-13 00:56:58.804457: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +17: 2023-05-13 00:56:58.804396: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 4: 2023-05-13 00:56:58.804418: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +17: 2023-05-13 00:56:58.804399: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +29: 2023-05-13 00:56:58.804502: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +29: 2023-05-13 00:56:58.804522: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +29: 2023-05-13 00:56:58.804556: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +29: 2023-05-13 00:56:58.804558: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +29: 2023-05-13 00:56:58.804567: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +18: 2023-05-13 00:56:58.804503: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +18: 2023-05-13 00:56:58.804526: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +18: 2023-05-13 00:56:58.804535: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +29: 2023-05-13 00:56:58.804584: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +29: 2023-05-13 00:56:58.804594: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 6: 2023-05-13 00:56:58.804508: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 6: 2023-05-13 00:56:58.804529: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +18: 2023-05-13 00:56:58.804578: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +18: 2023-05-13 00:56:58.804570: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +18: 2023-05-13 00:56:58.804579: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +18: 2023-05-13 00:56:58.804584: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +18: 2023-05-13 00:56:58.804593: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 6: 2023-05-13 00:56:58.804540: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 6: 2023-05-13 00:56:58.804561: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 6: 2023-05-13 00:56:58.804568: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 6: 2023-05-13 00:56:58.804575: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 6: 2023-05-13 00:56:58.804582: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 6: 2023-05-13 00:56:58.804584: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 0: 2023-05-13 00:56:58.802898: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:56:58.802891: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:56:58.802894: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libcudart.so.11.0'; dlerror: libcudart.so.11.0: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:56:58.804032: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 0: 2023-05-13 00:56:58.804054: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 0: 2023-05-13 00:56:58.804066: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 0: 2023-05-13 00:56:58.804075: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 0: 2023-05-13 00:56:58.804097: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 0: 2023-05-13 00:56:58.804111: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 0: 2023-05-13 00:56:58.804122: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. + 0: 2023-05-13 00:56:58.804132: I tensorflow/compiler/xla/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine. +24: 2023-05-13 00:57:26.638755: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:57:26.638809: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:57:26.638792: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:57:26.638841: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:57:26.638898: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:57:26.638801: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:57:26.638869: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:57:26.638924: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:57:26.638839: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:57:26.638878: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:57:26.638948: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:57:26.638847: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:57:26.638892: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:57:26.638958: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:57:26.638852: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:57:26.638907: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:57:26.638966: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:57:26.638883: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:57:26.638929: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:57:26.638972: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:57:26.639080: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:57:26.639124: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:57:26.639155: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:57:26.639158: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:57:26.639356: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:57:26.639390: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:57:26.639409: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:57:26.639429: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:57:26.639442: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:57:26.639459: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:57:26.639465: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:57:26.639470: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:57:26.639900: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:57:26.639938: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:57:26.639955: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:57:26.639971: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:57:26.639985: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:57:26.640002: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:57:26.640024: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:57:26.640200: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:57:26.640384: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:57:26.640418: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:57:26.640445: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:57:26.640462: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:57:26.640476: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:57:26.640488: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:57:26.640491: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:57:26.640649: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:57:26.640505: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +19: 2023-05-13 00:57:26.640293: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:57:26.640512: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:57:26.640511: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:57:26.640511: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:57:26.640515: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:57:26.640521: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +24: 2023-05-13 00:57:26.640517: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +19: 2023-05-13 00:57:26.640329: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 3: 2023-05-13 00:57:26.640566: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:57:26.640526: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +24: 2023-05-13 00:57:26.640515: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +19: 2023-05-13 00:57:26.640357: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:57:26.640520: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:57:26.640534: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +19: 2023-05-13 00:57:26.640364: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:57:26.640535: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +24: 2023-05-13 00:57:26.640536: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +24: 2023-05-13 00:57:26.640537: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +19: 2023-05-13 00:57:26.640373: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +24: 2023-05-13 00:57:26.640539: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +24: 2023-05-13 00:57:26.640539: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +30: 2023-05-13 00:57:26.640724: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +19: 2023-05-13 00:57:26.640375: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +19: 2023-05-13 00:57:26.640567: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +19: 2023-05-13 00:57:26.640587: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:57:26.640792: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:57:26.640727: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:57:26.640729: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:57:26.640730: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 3: 2023-05-13 00:57:26.640597: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:57:26.640829: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:57:26.640731: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 3: 2023-05-13 00:57:26.640615: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:57:26.640842: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:57:26.640732: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 3: 2023-05-13 00:57:26.640657: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:57:26.640875: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:57:26.640736: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 3: 2023-05-13 00:57:26.640672: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:57:26.640884: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:57:26.640737: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:57:26.640742: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 3: 2023-05-13 00:57:26.640703: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:57:26.640887: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:57:26.640741: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +30: 2023-05-13 00:57:26.640744: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +30: 2023-05-13 00:57:26.640748: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 3: 2023-05-13 00:57:26.640736: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:57:26.641080: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:57:26.640750: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +30: 2023-05-13 00:57:26.640751: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +30: 2023-05-13 00:57:26.640749: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 3: 2023-05-13 00:57:26.640768: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +30: 2023-05-13 00:57:26.640749: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +26: 2023-05-13 00:57:26.641084: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:57:26.641058: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:57:26.641060: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:57:26.641061: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:57:26.641064: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:57:26.641157: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:57:26.641062: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:57:26.641065: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:57:26.641068: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:57:26.641070: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:57:26.641091: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 2: 2023-05-13 00:57:26.641160: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:57:26.641172: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +31: 2023-05-13 00:57:26.641092: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +31: 2023-05-13 00:57:26.641092: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +31: 2023-05-13 00:57:26.641093: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 2: 2023-05-13 00:57:26.641164: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +31: 2023-05-13 00:57:26.641094: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +31: 2023-05-13 00:57:26.641095: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +31: 2023-05-13 00:57:26.641095: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 2: 2023-05-13 00:57:26.641171: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:57:26.641182: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +31: 2023-05-13 00:57:26.641092: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 2: 2023-05-13 00:57:26.641175: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:57:26.641186: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 2: 2023-05-13 00:57:26.641194: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 2: 2023-05-13 00:57:26.641187: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:57:26.641187: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:57:26.641199: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 2: 2023-05-13 00:57:26.641195: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 2: 2023-05-13 00:57:26.641213: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 2: 2023-05-13 00:57:26.641214: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 2: 2023-05-13 00:57:26.641218: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +25: 2023-05-13 00:57:26.641684: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:57:26.641685: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:57:26.641694: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:57:26.641700: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +25: 2023-05-13 00:57:26.641701: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +25: 2023-05-13 00:57:26.641697: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:57:26.641696: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:57:26.641700: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:57:26.641700: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:57:26.641714: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +25: 2023-05-13 00:57:26.641705: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +25: 2023-05-13 00:57:26.641722: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +25: 2023-05-13 00:57:26.641723: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +25: 2023-05-13 00:57:26.641722: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +25: 2023-05-13 00:57:26.641724: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +25: 2023-05-13 00:57:26.641725: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 3: 2023-05-13 00:57:26.642210: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 3: 2023-05-13 00:57:26.642211: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 3: 2023-05-13 00:57:26.642211: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 3: 2023-05-13 00:57:26.642215: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 3: 2023-05-13 00:57:26.642218: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 3: 2023-05-13 00:57:26.642218: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 3: 2023-05-13 00:57:26.642222: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 3: 2023-05-13 00:57:26.642221: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 3: 2023-05-13 00:57:26.642245: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 3: 2023-05-13 00:57:26.642246: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 3: 2023-05-13 00:57:26.642244: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 3: 2023-05-13 00:57:26.642245: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 3: 2023-05-13 00:57:26.642246: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 3: 2023-05-13 00:57:26.642247: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 3: 2023-05-13 00:57:26.642246: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 3: 2023-05-13 00:57:26.642248: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 5: 2023-05-13 00:57:26.646699: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:57:26.646720: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:57:26.646727: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:57:26.646738: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:57:26.646744: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:57:26.646749: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:57:26.646753: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:57:26.647037: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:57:26.647008: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:57:26.647029: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:57:26.647040: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:57:26.647053: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:57:26.647061: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:57:26.647065: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:57:26.647069: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:57:26.647082: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:57:26.648087: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:57:26.648428: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:57:26.648344: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:57:26.648107: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:57:26.648431: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:57:26.648117: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:57:26.648359: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:57:26.648432: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:57:26.648133: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:57:26.648364: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:57:26.648429: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:57:26.648443: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 9: 2023-05-13 00:57:26.648141: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:57:26.648381: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:57:26.648439: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:57:26.648141: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:57:26.648386: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:57:26.648440: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:57:26.648157: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:57:26.648393: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:57:26.648438: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:57:26.648446: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 9: 2023-05-13 00:57:26.648158: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:57:26.648405: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:57:26.648448: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +14: 2023-05-13 00:57:26.648441: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:57:26.648510: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +14: 2023-05-13 00:57:26.648450: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +14: 2023-05-13 00:57:26.648458: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +14: 2023-05-13 00:57:26.648459: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +14: 2023-05-13 00:57:26.648460: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +14: 2023-05-13 00:57:26.648463: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 5: 2023-05-13 00:57:26.648472: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:57:26.648477: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:57:26.648482: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:57:26.648480: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:57:26.648482: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:57:26.648484: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:57:26.648486: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:57:26.648492: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 5: 2023-05-13 00:57:26.648492: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 5: 2023-05-13 00:57:26.648497: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 5: 2023-05-13 00:57:26.648491: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 5: 2023-05-13 00:57:26.648500: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 5: 2023-05-13 00:57:26.648501: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 5: 2023-05-13 00:57:26.648502: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 5: 2023-05-13 00:57:26.648503: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 5: 2023-05-13 00:57:26.648508: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +23: 2023-05-13 00:57:26.649294: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:57:26.649293: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:57:26.649294: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:57:26.649293: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:57:26.649295: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:57:26.649298: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:57:26.649300: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:57:26.649302: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +23: 2023-05-13 00:57:26.649310: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +23: 2023-05-13 00:57:26.649310: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +23: 2023-05-13 00:57:26.649318: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +23: 2023-05-13 00:57:26.649319: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +23: 2023-05-13 00:57:26.649318: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +23: 2023-05-13 00:57:26.649320: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +23: 2023-05-13 00:57:26.649321: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +23: 2023-05-13 00:57:26.649319: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 9: 2023-05-13 00:57:26.649779: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:57:26.649780: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:57:26.649782: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:57:26.649783: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:57:26.649786: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:57:26.649787: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:57:26.649789: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:57:26.649791: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 9: 2023-05-13 00:57:26.649811: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 9: 2023-05-13 00:57:26.649812: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 9: 2023-05-13 00:57:26.649812: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 9: 2023-05-13 00:57:26.649813: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 9: 2023-05-13 00:57:26.649814: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 9: 2023-05-13 00:57:26.649814: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 9: 2023-05-13 00:57:26.649812: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 9: 2023-05-13 00:57:26.649814: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +29: 2023-05-13 00:57:26.652519: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:57:26.652551: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:57:26.652566: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:57:26.652593: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:57:26.652600: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:57:26.652610: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:57:26.652618: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:57:26.652806: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:57:26.652910: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:57:26.652931: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:57:26.652940: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:57:26.652951: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:57:26.652955: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:57:26.653131: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:57:26.653132: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:57:26.653149: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:57:26.653321: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:57:26.653342: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:57:26.653353: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:57:26.653380: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:57:26.653383: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:57:26.653384: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:57:26.653464: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:57:26.653487: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:57:26.654322: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:57:26.654325: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:57:26.654338: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +29: 2023-05-13 00:57:26.654327: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:57:26.654328: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:57:26.654328: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:57:26.654333: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:57:26.654339: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:57:26.654350: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +29: 2023-05-13 00:57:26.654351: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +29: 2023-05-13 00:57:26.654343: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +29: 2023-05-13 00:57:26.654353: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +29: 2023-05-13 00:57:26.654353: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +29: 2023-05-13 00:57:26.654355: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +29: 2023-05-13 00:57:26.654362: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +29: 2023-05-13 00:57:26.654363: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +10: 2023-05-13 00:57:26.654352: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:57:26.654367: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +10: 2023-05-13 00:57:26.654363: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:57:26.654363: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:57:26.654365: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:57:26.654367: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:57:26.654370: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:57:26.654371: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:57:26.654376: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +10: 2023-05-13 00:57:26.654389: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +10: 2023-05-13 00:57:26.654389: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +10: 2023-05-13 00:57:26.654391: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +10: 2023-05-13 00:57:26.654392: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +10: 2023-05-13 00:57:26.654393: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +10: 2023-05-13 00:57:26.654394: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +10: 2023-05-13 00:57:26.654396: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 1: 2023-05-13 00:57:26.654826: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:57:26.654829: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:57:26.654829: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:57:26.654832: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:57:26.654832: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:57:26.654835: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:57:26.654837: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:57:26.654839: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 1: 2023-05-13 00:57:26.654856: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 1: 2023-05-13 00:57:26.654856: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 1: 2023-05-13 00:57:26.654859: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 1: 2023-05-13 00:57:26.654858: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 1: 2023-05-13 00:57:26.654859: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 1: 2023-05-13 00:57:26.654860: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 1: 2023-05-13 00:57:26.654861: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 1: 2023-05-13 00:57:26.654859: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +22: 2023-05-13 00:57:26.655157: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:57:26.655201: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:57:26.655206: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:57:26.655227: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:57:26.655234: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:57:26.655440: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:57:26.655443: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:57:26.655460: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:57:26.656177: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:57:26.656194: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +22: 2023-05-13 00:57:26.656195: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:57:26.656197: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:57:26.656199: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:57:26.656204: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:57:26.656203: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:57:26.656218: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +22: 2023-05-13 00:57:26.656212: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:57:26.656212: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:57:26.656225: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +22: 2023-05-13 00:57:26.656226: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +22: 2023-05-13 00:57:26.656230: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +22: 2023-05-13 00:57:26.656230: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +16: 2023-05-13 00:57:26.655788: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +22: 2023-05-13 00:57:26.656238: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +22: 2023-05-13 00:57:26.656239: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +16: 2023-05-13 00:57:26.655831: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:57:26.655842: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:57:26.655871: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:57:26.655873: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:57:26.655884: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:57:26.655891: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:57:26.656115: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:57:26.656789: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:57:26.656804: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +16: 2023-05-13 00:57:26.656816: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:57:26.656817: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:57:26.656822: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:57:26.656823: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:57:26.656827: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:57:26.656827: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:57:26.656840: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +16: 2023-05-13 00:57:26.656830: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +16: 2023-05-13 00:57:26.656840: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +16: 2023-05-13 00:57:26.656844: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +16: 2023-05-13 00:57:26.656845: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +16: 2023-05-13 00:57:26.656847: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +16: 2023-05-13 00:57:26.656850: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +16: 2023-05-13 00:57:26.656850: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +13: 2023-05-13 00:57:26.669926: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:57:26.669953: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:57:26.669974: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:57:26.669982: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:57:26.669991: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:57:26.669997: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:57:26.670202: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:57:26.670211: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:57:26.670442: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:57:26.670475: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:57:26.670852: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:57:26.670498: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:57:26.670515: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:57:26.670529: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:57:26.670889: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:57:26.670535: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:57:26.670908: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:57:26.670552: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:57:26.670814: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:57:26.670922: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:57:26.670559: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:57:26.670940: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:57:26.670953: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:57:26.670958: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:57:26.670893: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:57:26.671028: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:57:26.670840: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:57:26.670863: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:57:26.670875: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:57:26.670924: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:57:26.670887: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:57:26.670942: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:57:26.670898: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:57:26.670968: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:57:26.670903: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:57:26.670986: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:57:26.671097: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:57:26.670998: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:57:26.671018: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:57:26.671030: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +18: 2023-05-13 00:57:26.671606: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +18: 2023-05-13 00:57:26.671631: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +18: 2023-05-13 00:57:26.671626: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +18: 2023-05-13 00:57:26.671643: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +18: 2023-05-13 00:57:26.671652: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +18: 2023-05-13 00:57:26.671662: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +18: 2023-05-13 00:57:26.671667: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +18: 2023-05-13 00:57:26.671672: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:57:26.671683: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:57:26.671893: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:57:26.671900: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:57:26.671715: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:57:26.671912: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:57:26.671901: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:57:26.671731: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:57:26.671921: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:57:26.671903: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:57:26.671754: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:57:26.671935: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:57:26.671906: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:57:26.671773: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:57:26.671948: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:57:26.671907: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:57:26.671778: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:57:26.671958: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:57:26.671906: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:57:26.671782: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:57:26.671959: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:57:26.671909: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:57:26.671967: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:57:26.671975: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:57:26.671908: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +13: 2023-05-13 00:57:26.671920: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +13: 2023-05-13 00:57:26.671921: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +13: 2023-05-13 00:57:26.671921: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +13: 2023-05-13 00:57:26.671921: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +13: 2023-05-13 00:57:26.671923: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +13: 2023-05-13 00:57:26.671924: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +13: 2023-05-13 00:57:26.671925: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +13: 2023-05-13 00:57:26.671926: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 6: 2023-05-13 00:57:26.672075: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:57:26.672467: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:57:26.672482: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +21: 2023-05-13 00:57:26.672477: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:57:26.672478: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 6: 2023-05-13 00:57:26.672110: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:57:26.672479: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 6: 2023-05-13 00:57:26.672124: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:57:26.672482: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 6: 2023-05-13 00:57:26.672154: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:57:26.672485: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 6: 2023-05-13 00:57:26.672160: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:57:26.672487: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:57:26.672501: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 6: 2023-05-13 00:57:26.672167: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:57:26.672488: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:57:26.672502: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 6: 2023-05-13 00:57:26.672219: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:57:26.672503: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +21: 2023-05-13 00:57:26.672505: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +21: 2023-05-13 00:57:26.672506: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 6: 2023-05-13 00:57:26.672228: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +21: 2023-05-13 00:57:26.672508: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +21: 2023-05-13 00:57:26.672512: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +15: 2023-05-13 00:57:26.672565: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:57:26.672567: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:57:26.672568: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:57:26.672570: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:57:26.672572: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:57:26.672573: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:57:26.672565: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:57:26.672577: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:57:26.672596: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +15: 2023-05-13 00:57:26.672597: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +15: 2023-05-13 00:57:26.672596: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +15: 2023-05-13 00:57:26.672597: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +15: 2023-05-13 00:57:26.672598: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +15: 2023-05-13 00:57:26.672599: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +15: 2023-05-13 00:57:26.672599: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +28: 2023-05-13 00:57:26.672788: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +15: 2023-05-13 00:57:26.672598: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 8: 2023-05-13 00:57:26.672824: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:57:26.672794: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:57:26.672794: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:57:26.672795: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +18: 2023-05-13 00:57:26.672999: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:57:26.672798: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:57:26.672806: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 8: 2023-05-13 00:57:26.672825: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:57:26.672799: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:57:26.672826: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:57:26.672799: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:57:26.672830: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +18: 2023-05-13 00:57:26.673000: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:57:26.672801: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:57:26.672813: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 8: 2023-05-13 00:57:26.672827: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +18: 2023-05-13 00:57:26.673004: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:57:26.672814: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +28: 2023-05-13 00:57:26.672813: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +28: 2023-05-13 00:57:26.672814: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 8: 2023-05-13 00:57:26.672833: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +18: 2023-05-13 00:57:26.673001: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +28: 2023-05-13 00:57:26.672817: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +28: 2023-05-13 00:57:26.672818: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +28: 2023-05-13 00:57:26.672819: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 8: 2023-05-13 00:57:26.672837: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +18: 2023-05-13 00:57:26.673003: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:57:26.672836: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:57:26.672855: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +18: 2023-05-13 00:57:26.673006: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:57:26.672855: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 8: 2023-05-13 00:57:26.672856: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 8: 2023-05-13 00:57:26.672856: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +18: 2023-05-13 00:57:26.673009: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +18: 2023-05-13 00:57:26.673015: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 8: 2023-05-13 00:57:26.672856: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 8: 2023-05-13 00:57:26.672859: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 8: 2023-05-13 00:57:26.672859: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +18: 2023-05-13 00:57:26.673015: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +18: 2023-05-13 00:57:26.673011: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 8: 2023-05-13 00:57:26.672856: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +18: 2023-05-13 00:57:26.673020: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +18: 2023-05-13 00:57:26.673023: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +18: 2023-05-13 00:57:26.673022: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +18: 2023-05-13 00:57:26.673024: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +18: 2023-05-13 00:57:26.673026: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +18: 2023-05-13 00:57:26.673029: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 4: 2023-05-13 00:57:26.673101: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:57:26.673102: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:57:26.673105: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:57:26.673109: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:57:26.673109: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:57:26.673114: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:57:26.673116: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:57:26.673136: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 6: 2023-05-13 00:57:26.673224: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 6: 2023-05-13 00:57:26.673238: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 4: 2023-05-13 00:57:26.673136: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 4: 2023-05-13 00:57:26.673137: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 4: 2023-05-13 00:57:26.673137: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 6: 2023-05-13 00:57:26.673236: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:57:26.673137: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 4: 2023-05-13 00:57:26.673138: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 4: 2023-05-13 00:57:26.673137: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 6: 2023-05-13 00:57:26.673239: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:57:26.673257: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 6: 2023-05-13 00:57:26.673243: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 4: 2023-05-13 00:57:26.673270: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 6: 2023-05-13 00:57:26.673244: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:57:26.673190: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 6: 2023-05-13 00:57:26.673247: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 6: 2023-05-13 00:57:26.673250: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 6: 2023-05-13 00:57:26.673260: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 6: 2023-05-13 00:57:26.673243: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 6: 2023-05-13 00:57:26.673263: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 6: 2023-05-13 00:57:26.673266: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 6: 2023-05-13 00:57:26.673267: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +27: 2023-05-13 00:57:26.673199: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:57:26.673214: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 6: 2023-05-13 00:57:26.673268: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 6: 2023-05-13 00:57:26.673270: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 6: 2023-05-13 00:57:26.673273: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +27: 2023-05-13 00:57:26.673205: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:57:26.673222: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +27: 2023-05-13 00:57:26.673205: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:57:26.673210: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:57:26.673210: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:57:26.673215: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:57:26.673215: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +27: 2023-05-13 00:57:26.673247: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +27: 2023-05-13 00:57:26.673249: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +27: 2023-05-13 00:57:26.673250: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +27: 2023-05-13 00:57:26.673252: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +27: 2023-05-13 00:57:26.673253: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +27: 2023-05-13 00:57:26.673254: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +17: 2023-05-13 00:57:26.675107: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:57:26.675145: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:57:26.675170: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:57:26.675189: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:57:26.675212: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:57:26.675227: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:57:26.675234: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:57:26.675302: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:57:26.675700: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:57:26.675719: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:57:26.675727: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:57:26.675739: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:57:26.675744: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:57:26.675745: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:57:26.675795: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:57:26.675972: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:57:26.676007: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:57:26.676027: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:57:26.676060: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:57:26.676072: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:57:26.676087: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:57:26.676256: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:57:26.676262: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:57:26.676212: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:57:26.676251: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:57:26.676275: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:57:26.676294: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:57:26.676706: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:57:26.676308: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:57:26.676322: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:57:26.676338: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:57:26.676339: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:57:26.676721: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:57:26.676731: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:57:26.676745: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:57:26.676750: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:57:26.676758: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:57:26.676763: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:57:26.676776: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:57:26.676684: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:57:26.676684: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:57:26.676685: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:57:26.676688: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:57:26.676691: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:57:26.676693: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:57:26.676695: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:57:26.676693: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +17: 2023-05-13 00:57:26.676715: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +17: 2023-05-13 00:57:26.676718: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +17: 2023-05-13 00:57:26.676718: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +17: 2023-05-13 00:57:26.676719: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +17: 2023-05-13 00:57:26.676718: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +17: 2023-05-13 00:57:26.676717: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +17: 2023-05-13 00:57:26.676720: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +17: 2023-05-13 00:57:26.676720: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +20: 2023-05-13 00:57:26.677983: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:57:26.677986: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:57:26.677986: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:57:26.677987: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:57:26.677990: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:57:26.677994: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:57:26.677995: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:57:26.678000: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 7: 2023-05-13 00:57:26.677857: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:57:26.677872: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +11: 2023-05-13 00:57:26.677727: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:57:26.677999: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +20: 2023-05-13 00:57:26.677996: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:57:26.678005: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +20: 2023-05-13 00:57:26.678005: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +20: 2023-05-13 00:57:26.678006: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 7: 2023-05-13 00:57:26.677861: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:57:26.677727: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +20: 2023-05-13 00:57:26.678009: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +20: 2023-05-13 00:57:26.678013: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +20: 2023-05-13 00:57:26.678012: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 7: 2023-05-13 00:57:26.677861: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:57:26.677729: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:57:26.677864: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:57:26.677731: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:57:26.677867: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:57:26.677735: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:57:26.677872: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:57:26.677737: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:57:26.677874: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:57:26.677738: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:57:26.677872: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 7: 2023-05-13 00:57:26.677886: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +11: 2023-05-13 00:57:26.677743: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +11: 2023-05-13 00:57:26.677760: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 7: 2023-05-13 00:57:26.677887: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 7: 2023-05-13 00:57:26.677887: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 7: 2023-05-13 00:57:26.677889: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +11: 2023-05-13 00:57:26.677760: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +11: 2023-05-13 00:57:26.677761: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +11: 2023-05-13 00:57:26.677761: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 7: 2023-05-13 00:57:26.677893: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 7: 2023-05-13 00:57:26.677895: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 7: 2023-05-13 00:57:26.677896: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +11: 2023-05-13 00:57:26.677763: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +11: 2023-05-13 00:57:26.677764: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +11: 2023-05-13 00:57:26.677765: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +11: 2023-05-13 00:57:26.677762: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +19: 2023-05-13 00:57:26.641501: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +19: 2023-05-13 00:57:26.641525: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +12: 2023-05-13 00:57:26.640695: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:57:26.642151: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:57:26.642166: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +19: 2023-05-13 00:57:26.641525: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:57:26.640699: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:57:26.642160: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +19: 2023-05-13 00:57:26.641526: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:57:26.640701: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:57:26.642161: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +19: 2023-05-13 00:57:26.641533: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:57:26.640701: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:57:26.642169: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +19: 2023-05-13 00:57:26.641534: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:57:26.640709: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:57:26.642169: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +19: 2023-05-13 00:57:26.641537: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:57:26.640710: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:57:26.640720: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +26: 2023-05-13 00:57:26.642168: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +19: 2023-05-13 00:57:26.641539: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:57:26.640707: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:57:26.640725: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +26: 2023-05-13 00:57:26.642171: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:57:26.642186: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +19: 2023-05-13 00:57:26.641542: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +19: 2023-05-13 00:57:26.641563: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +12: 2023-05-13 00:57:26.640727: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +12: 2023-05-13 00:57:26.640728: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +12: 2023-05-13 00:57:26.640729: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +26: 2023-05-13 00:57:26.642172: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +26: 2023-05-13 00:57:26.642186: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +19: 2023-05-13 00:57:26.641564: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +19: 2023-05-13 00:57:26.641565: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +19: 2023-05-13 00:57:26.641566: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +12: 2023-05-13 00:57:26.640731: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +12: 2023-05-13 00:57:26.640735: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +26: 2023-05-13 00:57:26.642193: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +26: 2023-05-13 00:57:26.642196: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +26: 2023-05-13 00:57:26.642196: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +19: 2023-05-13 00:57:26.641567: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +19: 2023-05-13 00:57:26.641568: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +19: 2023-05-13 00:57:26.641569: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +12: 2023-05-13 00:57:26.640967: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 +12: 2023-05-13 00:57:26.640981: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +26: 2023-05-13 00:57:26.642198: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. +26: 2023-05-13 00:57:26.642198: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 0: 2023-05-13 00:57:26.675806: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:57:26.676744: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:57:26.676744: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:57:26.676745: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:57:26.676748: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:57:26.676751: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:57:26.676753: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:57:26.676754: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:57:26.676757: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /pfs/lustrep2/projappl/project_462000125/samantao-public/apps-rocm-5.2.3/aws-ofi-rccl:/opt/rocm/lib64:/opt/rocm/lib:/opt/rocm/rocprofiler/lib:/opt/rocm/rocprofiler/tool:/opt/rocm/roctracer/lib:/opt/rocm/roctracer/tool:/opt/rocm/hip/lib:/opt/cray/pe/python/3.9.13.1/lib:/opt/cray/pe/gcc-libs:/opt/cray/libfabric/1.15.2.0/lib64 + 0: 2023-05-13 00:57:26.676776: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 0: 2023-05-13 00:57:26.676776: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 0: 2023-05-13 00:57:26.676775: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 0: 2023-05-13 00:57:26.676777: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 0: 2023-05-13 00:57:26.676777: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 0: 2023-05-13 00:57:26.676778: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 0: 2023-05-13 00:57:26.676780: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 0: 2023-05-13 00:57:26.676781: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly. + 0: Successfully preprocessed all matching files. + 0: Detected CUDA files, patching ldflags + 0: Emitting ninja build file /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/build/build.ninja... + 0: Building extension module scaled_upper_triang_masked_softmax_cuda... + 0: Allowing ninja to set a default number of workers... (overridable by setting the environment variable MAX_JOBS=N) + 0: Loading extension module scaled_upper_triang_masked_softmax_cuda... + 0: Successfully preprocessed all matching files. + 0: Detected CUDA files, patching ldflags + 0: Emitting ninja build file /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/build/build.ninja... + 0: Building extension module scaled_masked_softmax_cuda... + 0: Allowing ninja to set a default number of workers... (overridable by setting the environment variable MAX_JOBS=N) + 0: Loading extension module scaled_masked_softmax_cuda... + 0: Successfully preprocessed all matching files. + 0: Detected CUDA files, patching ldflags + 0: Emitting ninja build file /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/build/build.ninja... + 0: Building extension module fused_mix_prec_layer_norm_cuda... + 0: Allowing ninja to set a default number of workers... (overridable by setting the environment variable MAX_JOBS=N) + 0: Loading extension module fused_mix_prec_layer_norm_cuda... +30: Successfully preprocessed all matching files. +16: Successfully preprocessed all matching files. +16: Successfully preprocessed all matching files. + 6: Successfully preprocessed all matching files. + 6: Successfully preprocessed all matching files. +16: Successfully preprocessed all matching files. +12: Successfully preprocessed all matching files. +30: Successfully preprocessed all matching files. + 6: Successfully preprocessed all matching files. +28: Successfully preprocessed all matching files. +23: Successfully preprocessed all matching files. +11: Successfully preprocessed all matching files. + 0: Successfully preprocessed all matching files. + 0: Successfully preprocessed all matching files. + 0: Successfully preprocessed all matching files. +21: Successfully preprocessed all matching files. +21: Successfully preprocessed all matching files. +21: Successfully preprocessed all matching files. +12: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +12: warnings.warn( +12: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +12: warnings.warn( +12: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +12: warnings.warn( +30: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +30: warnings.warn( +30: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +30: warnings.warn( +30: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +30: warnings.warn( +30: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +30: warnings.warn( +30: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +30: warnings.warn( +16: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +16: warnings.warn( +30: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +30: warnings.warn( +30: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +30: warnings.warn( +16: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +16: warnings.warn( +21: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +21: warnings.warn( +21: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +21: warnings.warn( +21: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +21: warnings.warn( +21: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +21: warnings.warn( +21: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +21: warnings.warn( +21: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +21: warnings.warn( +16: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +16: warnings.warn( +16: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +16: warnings.warn( +16: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +16: warnings.warn( +21: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +21: warnings.warn( +16: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +16: warnings.warn( +16: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +16: warnings.warn( +12: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +12: warnings.warn( +12: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +12: warnings.warn( +21: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +21: warnings.warn( +12: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +12: warnings.warn( +12: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +12: warnings.warn( +16: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +16: warnings.warn( + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 0: warnings.warn( + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 0: warnings.warn( + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 0: warnings.warn( + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 0: warnings.warn( + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 0: warnings.warn( + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 0: warnings.warn( + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 0: warnings.warn( + 3: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 3: warnings.warn( + 3: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 3: warnings.warn( + 3: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 3: warnings.warn( + 3: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 3: warnings.warn( + 3: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 3: warnings.warn( + 3: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 3: warnings.warn( + 3: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 3: warnings.warn( + 3: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 3: warnings.warn( +23: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +23: warnings.warn( +23: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +23: warnings.warn( +23: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +23: warnings.warn( +23: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +23: warnings.warn( +23: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +23: warnings.warn( +23: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +23: warnings.warn( +23: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +23: warnings.warn( +23: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +23: warnings.warn( + 4: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 4: warnings.warn( +28: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +28: warnings.warn( +28: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +28: warnings.warn( +28: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +28: warnings.warn( + 4: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 4: warnings.warn( + 4: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 4: warnings.warn( + 4: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 4: warnings.warn( +28: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +28: warnings.warn( +28: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +28: warnings.warn( +28: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +28: warnings.warn( + 4: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 4: warnings.warn( +28: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +28: warnings.warn( + 4: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 4: warnings.warn( +28: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +28: warnings.warn( + 4: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 4: warnings.warn( + 4: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 4: warnings.warn( +13: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +13: warnings.warn( +13: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +13: warnings.warn( +13: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +13: warnings.warn( +13: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +13: warnings.warn( +13: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +13: warnings.warn( +13: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +13: warnings.warn( +20: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +20: warnings.warn( +20: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +20: warnings.warn( +20: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +20: warnings.warn( +20: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +20: warnings.warn( +20: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +20: warnings.warn( +20: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +20: warnings.warn( +20: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +20: warnings.warn( +20: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +20: warnings.warn( +30: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +30: warnings.warn( +12: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +12: warnings.warn( +27: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +27: warnings.warn( + 6: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 6: warnings.warn( +27: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +27: warnings.warn( +27: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +27: warnings.warn( +26: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +26: warnings.warn( +22: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +22: warnings.warn( +31: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +31: warnings.warn( +31: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +31: warnings.warn( +31: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +31: warnings.warn( + 6: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 6: warnings.warn( +27: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +27: warnings.warn( +27: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +27: warnings.warn( +26: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +26: warnings.warn( +22: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +22: warnings.warn( +31: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +31: warnings.warn( +14: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +14: warnings.warn( +14: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +14: warnings.warn( +14: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +14: warnings.warn( +10: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +10: warnings.warn( +10: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +10: warnings.warn( +22: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +22: warnings.warn( +22: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +22: warnings.warn( +31: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +31: warnings.warn( +31: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +31: warnings.warn( +31: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +31: warnings.warn( +14: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +14: warnings.warn( + 6: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 6: warnings.warn( + 6: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 6: warnings.warn( + 6: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 6: warnings.warn( +11: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +11: warnings.warn( +11: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +11: warnings.warn( +11: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +11: warnings.warn( +10: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +10: warnings.warn( +10: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +10: warnings.warn( +10: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +10: warnings.warn( +26: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +26: warnings.warn( +26: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +26: warnings.warn( +26: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +26: warnings.warn( +22: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +22: warnings.warn( +22: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +22: warnings.warn( +22: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +22: warnings.warn( +31: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +31: warnings.warn( +14: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +14: warnings.warn( +14: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +14: warnings.warn( +14: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +14: warnings.warn( +11: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +11: warnings.warn( +11: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +11: warnings.warn( +11: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +11: warnings.warn( +10: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +10: warnings.warn( +10: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +10: warnings.warn( +18: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +18: warnings.warn( +18: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +18: warnings.warn( + 6: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 6: warnings.warn( + 6: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 6: warnings.warn( + 2: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 2: warnings.warn( + 2: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 2: warnings.warn( + 2: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 2: warnings.warn( +11: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +11: warnings.warn( +18: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +18: warnings.warn( +26: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +26: warnings.warn( +26: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +26: warnings.warn( +22: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +22: warnings.warn( +14: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +14: warnings.warn( +18: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +18: warnings.warn( +18: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +18: warnings.warn( + 6: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 6: warnings.warn( + 2: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 2: warnings.warn( + 2: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 2: warnings.warn( + 2: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 2: warnings.warn( + 2: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 2: warnings.warn( +18: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +18: warnings.warn( +18: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +18: warnings.warn( +10: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +10: warnings.warn( +11: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +11: warnings.warn( +18: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +18: warnings.warn( + 8: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 8: warnings.warn( + 8: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 8: warnings.warn( + 8: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 8: warnings.warn( +26: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +26: warnings.warn( + 8: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 8: warnings.warn( + 8: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 8: warnings.warn( + 8: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 8: warnings.warn( + 2: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 2: warnings.warn( + 8: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 8: warnings.warn( + 8: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 8: warnings.warn( +15: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +15: warnings.warn( +15: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +15: warnings.warn( +15: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +15: warnings.warn( +15: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +15: warnings.warn( +15: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +15: warnings.warn( +15: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +15: warnings.warn( + 7: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 7: warnings.warn( + 7: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 7: warnings.warn( + 7: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 7: warnings.warn( +15: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +15: warnings.warn( + 7: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 7: warnings.warn( + 7: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 7: warnings.warn( + 7: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 7: warnings.warn( + 7: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 7: warnings.warn( + 7: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 7: warnings.warn( +15: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +15: warnings.warn( + 5: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 5: warnings.warn( + 5: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 5: warnings.warn( + 5: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 5: warnings.warn( + 5: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 5: warnings.warn( + 5: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 5: warnings.warn( + 5: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 5: warnings.warn( + 5: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 5: warnings.warn( +17: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +17: warnings.warn( + 5: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 5: warnings.warn( +17: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +17: warnings.warn( +17: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +17: warnings.warn( +17: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +17: warnings.warn( +17: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +17: warnings.warn( +17: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +17: warnings.warn( +17: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +17: warnings.warn( +19: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +19: warnings.warn( +19: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +19: warnings.warn( +19: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +19: warnings.warn( +19: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +19: warnings.warn( +19: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +19: warnings.warn( +19: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +19: warnings.warn( +19: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +19: warnings.warn( +29: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +29: warnings.warn( +29: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +29: warnings.warn( +29: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +29: warnings.warn( +29: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +29: warnings.warn( +29: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +29: warnings.warn( +29: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +29: warnings.warn( +29: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +29: warnings.warn( +29: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +29: warnings.warn( +17: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +17: warnings.warn( +19: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +19: warnings.warn( +25: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +25: warnings.warn( +25: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +25: warnings.warn( +25: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +25: warnings.warn( +25: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +25: warnings.warn( +25: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +25: warnings.warn( +25: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +25: warnings.warn( +25: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +25: warnings.warn( +25: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +25: warnings.warn( +24: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +24: warnings.warn( +24: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +24: warnings.warn( +24: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +24: warnings.warn( + 1: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 1: warnings.warn( + 1: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 1: warnings.warn( + 1: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 1: warnings.warn( + 1: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 1: warnings.warn( + 1: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 1: warnings.warn( + 1: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 1: warnings.warn( + 1: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 1: warnings.warn( + 1: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 1: warnings.warn( +24: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +24: warnings.warn( +24: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +24: warnings.warn( +24: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +24: warnings.warn( +24: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +24: warnings.warn( +13: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +13: warnings.warn( +13: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +13: warnings.warn( +24: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +24: warnings.warn( + 9: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 9: warnings.warn( + 9: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 9: warnings.warn( + 9: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 9: warnings.warn( + 9: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 9: warnings.warn( + 9: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 9: warnings.warn( + 9: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 9: warnings.warn( + 9: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 9: warnings.warn( + 9: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 9: warnings.warn( +27: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +27: warnings.warn( +27: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +27: warnings.warn( +27: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead +27: warnings.warn( + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/distributed/distributed_c10d.py:429: UserWarning: torch.distributed.distributed_c10d._get_global_rank is deprecated please use torch.distributed.distributed_c10d.get_global_rank instead + 0: warnings.warn( + 0: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 0: + 0: + 0: + 0: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 0: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 4: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 4: + 4: + 4: + 4: + 4: + 4: + 4: + 3: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 3: + 3: + 3: + 3: + 3: + 3: + 3: + 8: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 8: + 8: + 8: + 8: + 8: + 8: + 8: + 5: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 5: + 5: + 5: + 5: + 5: + 5: + 5: + 2: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 2: + 2: + 2: + 2: + 2: + 2: + 2: + 1: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 1: + 1: + 1: + 1: + 1: + 1: + 1: + 7: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 7: + 7: + 7: + 7: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 7: +11: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +11: +11: +10: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +10: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +10: +10: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +10: +10: +10: +10: +23: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +23: +21: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +21: +21: +18: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +18: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +18: +18: +18: +18: +18: +18: +15: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +15: +15: +15: +15: +15: +15: +15: +16: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +16: +16: +16: +16: +16: +14: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +14: +14: +14: +14: +14: +14: +14: + 6: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 6: + 6: + 6: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 9: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 9: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 9: + 9: + 9: + 9: + 9: + 9: +12: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +12: +12: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +12: +12: +12: +12: +12: + 0: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 7: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 7: +11: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +23: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +21: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +16: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 6: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 6: + 0: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +11: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +23: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +23: +23: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +21: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +16: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 6: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +11: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +11: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +23: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +23: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +21: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 6: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +11: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +21: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +21: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +30: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +30: +30: +30: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +30: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +30: +30: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +30: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +22: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +22: +22: +22: +22: +22: +22: +22: +17: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +17: +17: +17: +17: +17: +17: +17: +13: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +13: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +13: +13: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +13: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +13: +13: +13: +20: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +20: +20: +20: +20: +20: +20: +20: +19: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +19: +19: +19: +19: +19: +19: +19: +28: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +28: +28: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +28: +28: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +28: +28: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +28: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +25: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +25: +25: +25: +25: +25: +25: +25: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +24: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +24: +24: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +24: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +24: +24: +24: +24: +26: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +26: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +26: +26: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +26: +26: +26: +26: +29: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +29: +29: +29: +29: +29: +29: +29: +27: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +27: +27: +27: +27: +27: +27: +27: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +31: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +31: +31: +31: +31: +31: +31: +31: + 0: Emitting ninja build file /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu/utils/build.ninja... + 0: Building extension module utils... + 0: Allowing ninja to set a default number of workers... (overridable by setting the environment variable MAX_JOBS=N) + 0: Loading extension module utils... + 0: Loading extension module utils... + 0: Loading extension module utils... + 0: Loading extension module utils... + 0: Loading extension module utils... + 0: Loading extension module utils... + 0: Loading extension module utils... + 0: Loading extension module utils... + 1: Loading extension module utils... + 1: Loading extension module utils... + 1: Loading extension module utils... + 1: Loading extension module utils... + 1: Loading extension module utils... + 1: Loading extension module utils... + 1: Loading extension module utils... + 1: Loading extension module utils... +11: Loading extension module utils... + 6: Loading extension module utils... +11: Loading extension module utils... + 2: Loading extension module utils... + 3: Loading extension module utils... +11: Loading extension module utils... + 6: Loading extension module utils... + 2: Loading extension module utils... + 3: Loading extension module utils... +11: Loading extension module utils... + 5: Loading extension module utils... + 2: Loading extension module utils... + 2: Loading extension module utils... + 6: Loading extension module utils... + 8: Loading extension module utils... + 3: Loading extension module utils... +11: Loading extension module utils... + 4: Loading extension module utils... + 6: Loading extension module utils... + 2: Loading extension module utils... +29: Loading extension module utils... +30: Loading extension module utils... +11: Loading extension module utils... + 3: Loading extension module utils... +31: Loading extension module utils... + 8: Loading extension module utils... + 4: Loading extension module utils... + 2: Loading extension module utils... +10: Loading extension module utils... +30: Loading extension module utils... +29: Loading extension module utils... +16: Loading extension module utils... +25: Loading extension module utils... +21: Loading extension module utils... +16: Loading extension module utils... + 6: Loading extension module utils... + 7: Loading extension module utils... +15: Loading extension module utils... +29: Loading extension module utils... +25: Loading extension module utils... + 3: Loading extension module utils... + 8: Loading extension module utils... +18: Loading extension module utils... +24: Loading extension module utils... + 2: Loading extension module utils... + 5: Loading extension module utils... +14: Loading extension module utils... + 6: Loading extension module utils... + 4: Loading extension module utils... +26: Loading extension module utils... +31: Loading extension module utils... +30: Loading extension module utils... + 3: Loading extension module utils... +19: Loading extension module utils... +12: Loading extension module utils... +27: Loading extension module utils... + 8: Loading extension module utils... +11: Loading extension module utils... +31: Loading extension module utils... +25: Loading extension module utils... +17: Loading extension module utils... + 2: Loading extension module utils... +18: Loading extension module utils... +21: Loading extension module utils... +15: Loading extension module utils... +16: Loading extension module utils... +14: Loading extension module utils... + 4: Loading extension module utils... +10: Loading extension module utils... +30: Loading extension module utils... + 6: Loading extension module utils... +24: Loading extension module utils... + 9: Loading extension module utils... + 7: Loading extension module utils... +29: Loading extension module utils... +14: Loading extension module utils... +20: Loading extension module utils... +18: Loading extension module utils... +22: Loading extension module utils... +25: Loading extension module utils... +31: Loading extension module utils... + 8: Loading extension module utils... +30: Loading extension module utils... + 9: Loading extension module utils... +10: Loading extension module utils... +21: Loading extension module utils... +26: Loading extension module utils... +27: Loading extension module utils... + 4: Loading extension module utils... +19: Loading extension module utils... +14: Loading extension module utils... +17: Loading extension module utils... + 6: Loading extension module utils... +18: Loading extension module utils... +24: Loading extension module utils... +25: Loading extension module utils... +16: Loading extension module utils... +22: Loading extension module utils... + 5: Loading extension module utils... +28: Loading extension module utils... +15: Loading extension module utils... +23: Loading extension module utils... + 9: Loading extension module utils... + 8: Loading extension module utils... +13: Loading extension module utils... +30: Loading extension module utils... +29: Loading extension module utils... +18: Loading extension module utils... + 7: Loading extension module utils... +31: Loading extension module utils... +16: Loading extension module utils... +14: Loading extension module utils... +25: Loading extension module utils... +11: Loading extension module utils... +21: Loading extension module utils... +17: Loading extension module utils... +10: Loading extension module utils... +24: Loading extension module utils... + 3: Loading extension module utils... + 4: Loading extension module utils... + 8: Loading extension module utils... +22: Loading extension module utils... +31: Loading extension module utils... +20: Loading extension module utils... +26: Loading extension module utils... +27: Loading extension module utils... + 5: Loading extension module utils... +15: Loading extension module utils... +10: Loading extension module utils... + 8: Loading extension module utils... +18: Loading extension module utils... +19: Loading extension module utils... +14: Loading extension module utils... + 9: Loading extension module utils... +29: Loading extension module utils... + 3: Loading extension module utils... +14: Loading extension module utils... +25: Loading extension module utils... +24: Loading extension module utils... + 9: Loading extension module utils... + 4: Loading extension module utils... +30: Loading extension module utils... +18: Loading extension module utils... +16: Loading extension module utils... +17: Loading extension module utils... +26: Loading extension module utils... + 7: Loading extension module utils... +31: Loading extension module utils... +10: Loading extension module utils... +24: Loading extension module utils... +19: Loading extension module utils... +25: Loading extension module utils... +20: Loading extension module utils... +23: Loading extension module utils... +14: Loading extension module utils... +27: Loading extension module utils... +21: Loading extension module utils... +22: Loading extension module utils... +29: Loading extension module utils... +16: Loading extension module utils... + 4: Loading extension module utils... +15: Loading extension module utils... +30: Loading extension module utils... + 7: Loading extension module utils... +18: Loading extension module utils... +31: Loading extension module utils... + 9: Loading extension module utils... + 5: Loading extension module utils... +10: Loading extension module utils... +22: Loading extension module utils... +24: Loading extension module utils... +16: Loading extension module utils... +17: Loading extension module utils... +29: Loading extension module utils... +27: Loading extension module utils... +26: Loading extension module utils... + 9: Loading extension module utils... +10: Loading extension module utils... +17: Loading extension module utils... +24: Loading extension module utils... +21: Loading extension module utils... + 5: Loading extension module utils... +22: Loading extension module utils... +20: Loading extension module utils... + 7: Loading extension module utils... +26: Loading extension module utils... +15: Loading extension module utils... + 9: Loading extension module utils... +19: Loading extension module utils... +27: Loading extension module utils... +17: Loading extension module utils... +23: Loading extension module utils... +20: Loading extension module utils... +21: Loading extension module utils... +22: Loading extension module utils... +28: Loading extension module utils... +12: Loading extension module utils... + 7: Loading extension module utils... +13: Loading extension module utils... +15: Loading extension module utils... + 5: Loading extension module utils... +17: Loading extension module utils... +20: Loading extension module utils... +26: Loading extension module utils... +27: Loading extension module utils... +21: Loading extension module utils... +19: Loading extension module utils... +12: Loading extension module utils... +15: Loading extension module utils... +22: Loading extension module utils... + 7: Loading extension module utils... +20: Loading extension module utils... +26: Loading extension module utils... +27: Loading extension module utils... + 5: Loading extension module utils... +19: Loading extension module utils... +28: Loading extension module utils... +20: Loading extension module utils... +23: Loading extension module utils... +13: Loading extension module utils... +12: Loading extension module utils... +19: Loading extension module utils... +28: Loading extension module utils... +23: Loading extension module utils... +13: Loading extension module utils... +23: Loading extension module utils... +28: Loading extension module utils... +12: Loading extension module utils... +13: Loading extension module utils... +23: Loading extension module utils... +23: Loading extension module utils... +28: Loading extension module utils... +12: Loading extension module utils... +13: Loading extension module utils... +28: Loading extension module utils... +12: Loading extension module utils... +13: Loading extension module utils... +28: Loading extension module utils... +12: Loading extension module utils... +13: Loading extension module utils... + 0: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 0: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 0: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 0: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +21: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 0: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 0: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +21: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +21: +21: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +21: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +21: +21: +21: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 0: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +21: No modifications detected for re-loaded extension module utils, skipping build step... +21: Loading extension module utils... +21: No modifications detected for re-loaded extension module utils, skipping build step... +21: Loading extension module utils... +21: No modifications detected for re-loaded extension module utils, skipping build step... +21: Loading extension module utils... +21: No modifications detected for re-loaded extension module utils, skipping build step... +21: Loading extension module utils... +21: No modifications detected for re-loaded extension module utils, skipping build step... +21: Loading extension module utils...No modifications detected for re-loaded extension module utils, skipping build step... +21: +21: Loading extension module utils... +21: No modifications detected for re-loaded extension module utils, skipping build step... +21: Loading extension module utils...No modifications detected for re-loaded extension module utils, skipping build step... +21: +21: Loading extension module utils... + 0: No modifications detected for re-loaded extension module utils, skipping build step... + 0: Loading extension module utils... + 0: No modifications detected for re-loaded extension module utils, skipping build step... + 0: Loading extension module utils... + 0: No modifications detected for re-loaded extension module utils, skipping build step... + 0: Loading extension module utils... +12: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +12: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +12: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +12: +12: +12: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +12: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +12: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 0: No modifications detected for re-loaded extension module utils, skipping build step... + 0: Loading extension module utils... + 0: No modifications detected for re-loaded extension module utils, skipping build step... + 0: No modifications detected for re-loaded extension module utils, skipping build step...Loading extension module utils... + 0: + 0: Loading extension module utils... + 0: No modifications detected for re-loaded extension module utils, skipping build step... + 0: Loading extension module utils... +12: No modifications detected for re-loaded extension module utils, skipping build step... +12: Loading extension module utils... +12: No modifications detected for re-loaded extension module utils, skipping build step... +12: Loading extension module utils... +12: No modifications detected for re-loaded extension module utils, skipping build step... +12: Loading extension module utils... +12: No modifications detected for re-loaded extension module utils, skipping build step... +12: Loading extension module utils... +12: No modifications detected for re-loaded extension module utils, skipping build step... +12: Loading extension module utils... +12: No modifications detected for re-loaded extension module utils, skipping build step... +12: Loading extension module utils... +12: No modifications detected for re-loaded extension module utils, skipping build step... +12: Loading extension module utils... +12: No modifications detected for re-loaded extension module utils, skipping build step... +12: Loading extension module utils... +16: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +16: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +16: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +16: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +16: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +16: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +16: +16: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +16: No modifications detected for re-loaded extension module utils, skipping build step... +16: Loading extension module utils... +16: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... +16: +16: +16: Loading extension module utils...Loading extension module utils...Loading extension module utils...No modifications detected for re-loaded extension module utils, skipping build step... +16: +16: +16: No modifications detected for re-loaded extension module utils, skipping build step... +16: +16: Loading extension module utils... +16: Loading extension module utils... +16: No modifications detected for re-loaded extension module utils, skipping build step... +16: Loading extension module utils... +16: No modifications detected for re-loaded extension module utils, skipping build step... +16: Loading extension module utils... +30: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +30: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +30: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +30: +30: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +30: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +30: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +30: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +30: No modifications detected for re-loaded extension module utils, skipping build step... +30: Loading extension module utils... +30: No modifications detected for re-loaded extension module utils, skipping build step... +30: Loading extension module utils... +30: No modifications detected for re-loaded extension module utils, skipping build step... +30: Loading extension module utils... +30: No modifications detected for re-loaded extension module utils, skipping build step... +30: Loading extension module utils... +30: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... +30: +30: Loading extension module utils...Loading extension module utils... +30: +30: No modifications detected for re-loaded extension module utils, skipping build step... +30: Loading extension module utils... +30: No modifications detected for re-loaded extension module utils, skipping build step... +30: Loading extension module utils... + 8: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +24: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 1: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 1: + 1: + 1: + 1: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 1: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +25: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +25: + 8: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +15: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +25: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 8: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +10: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +25: No modifications detected for re-loaded extension module utils, skipping build step... +25: Loading extension module utils... + 2: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 2: +15: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +24: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +24: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +24: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +24: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +24: +24: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +24: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +15: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +15: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +15: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +15: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +15: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +15: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +25: No modifications detected for re-loaded extension module utils, skipping build step... +25: Loading extension module utils... + 4: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 1: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 1: +25: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +25: +25: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +25: +25: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +25: No modifications detected for re-loaded extension module utils, skipping build step... +25: Loading extension module utils... + 8: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 8: + 8: + 8: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 2: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 2: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 2: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 2: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 2: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 2: +10: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +10: +10: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +10: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +10: +10: +10: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +13: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +13: +13: +13: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +13: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +13: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +13: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +13: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +31: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +31: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 8: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +25: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... +25: +25: +25: +25: +25: Loading extension module utils...Loading extension module utils...Loading extension module utils...Loading extension module utils...Loading extension module utils... +25: +25: +25: +25: +17: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 8: No modifications detected for re-loaded extension module utils, skipping build step... + 8: Loading extension module utils... +18: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +18: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +18: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +18: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +18: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +18: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +18: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +18: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 4: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 4: + 4: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 4: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 4: + 4: + 4: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 1: No modifications detected for re-loaded extension module utils, skipping build step... + 1: Loading extension module utils... +22: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 3: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 3: + 3: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +11: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +11: +11: +11: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +11: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +11: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +11: +11: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +23: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +23: +23: +23: +23: +14: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +14: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +14: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +14: +14: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +14: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +14: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +14: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +27: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +10: No modifications detected for re-loaded extension module utils, skipping build step... +10: Loading extension module utils... +22: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +31: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +31: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +31: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +31: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +31: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +31: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 7: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +13: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... +13: +13: Loading extension module utils...Loading extension module utils... +13: +23: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +22: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 9: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 9: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 9: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 9: + 9: + 9: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 9: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 9: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +17: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +17: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 3: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 3: + 3: + 3: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 3: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 1: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... + 1: + 1: Loading extension module utils...No modifications detected for re-loaded extension module utils, skipping build step...Loading extension module utils... + 1: + 1: + 1: Loading extension module utils... + 1: No modifications detected for re-loaded extension module utils, skipping build step... + 1: Loading extension module utils... + 1: No modifications detected for re-loaded extension module utils, skipping build step... + 1: Loading extension module utils... + 1: No modifications detected for re-loaded extension module utils, skipping build step... +23: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +23: +26: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +22: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +22: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +22: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +22: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +22: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +28: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +14: No modifications detected for re-loaded extension module utils, skipping build step... +14: Loading extension module utils... + 1: Loading extension module utils... + 7: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +11: No modifications detected for re-loaded extension module utils, skipping build step... +11: Loading extension module utils... +11: No modifications detected for re-loaded extension module utils, skipping build step... +11: Loading extension module utils... +11: No modifications detected for re-loaded extension module utils, skipping build step... +11: Loading extension module utils... +13: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... +28: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +28: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 6: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 6: + 6: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 6: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 6: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 6: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 6: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 6: +27: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +27: +27: +27: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +27: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +27: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +27: +20: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +20: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +20: +20: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +20: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +20: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +20: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +20: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 8: No modifications detected for re-loaded extension module utils, skipping build step... + 8: Loading extension module utils... + 5: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 5: + 5: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 7: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 7: +29: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +29: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +29: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +29: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +29: +29: +29: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +29: +28: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 8: No modifications detected for re-loaded extension module utils, skipping build step... + 8: No modifications detected for re-loaded extension module utils, skipping build step...Loading extension module utils... + 8: +10: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... +10: +10: +10: +10: Loading extension module utils...Loading extension module utils...Loading extension module utils... +10: Loading extension module utils... +10: +10: +10: No modifications detected for re-loaded extension module utils, skipping build step... +13: +13: +13: Loading extension module utils...Loading extension module utils... +13: Loading extension module utils... +13: +13: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... +13: +13: Loading extension module utils...Loading extension module utils... +14: No modifications detected for re-loaded extension module utils, skipping build step... +14: Loading extension module utils... +14: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... +14: +14: Loading extension module utils... +14: Loading extension module utils... +17: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +17: +17: +17: +17: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 5: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 7: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 7: + 7: + 7: +13: +26: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +26: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +26: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +26: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +28: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +28: +28: + 8: Loading extension module utils... + 8: No modifications detected for re-loaded extension module utils, skipping build step... + 8: Loading extension module utils... + 5: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 5: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +10: Loading extension module utils... +10: No modifications detected for re-loaded extension module utils, skipping build step... +10: Loading extension module utils... +10: No modifications detected for re-loaded extension module utils, skipping build step... +15: No modifications detected for re-loaded extension module utils, skipping build step... +15: Loading extension module utils... +26: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +19: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +19: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +19: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +19: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +19: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root...Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +19: +19: +19: +28: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 8: No modifications detected for re-loaded extension module utils, skipping build step... + 8: Loading extension module utils... + 5: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +26: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 8: No modifications detected for re-loaded extension module utils, skipping build step... + 8: Loading extension module utils... + 5: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +10: Loading extension module utils... +29: No modifications detected for re-loaded extension module utils, skipping build step... +29: Loading extension module utils... +26: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... +29: No modifications detected for re-loaded extension module utils, skipping build step... +29: No modifications detected for re-loaded extension module utils, skipping build step...Loading extension module utils... +29: +29: Loading extension module utils... +29: No modifications detected for re-loaded extension module utils, skipping build step... +29: Loading extension module utils... +29: No modifications detected for re-loaded extension module utils, skipping build step... +29: Loading extension module utils... +27: No modifications detected for re-loaded extension module utils, skipping build step... +27: Loading extension module utils... +14: No modifications detected for re-loaded extension module utils, skipping build step... +14: Loading extension module utils... +27: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... +27: +13: No modifications detected for re-loaded extension module utils, skipping build step... +13: Loading extension module utils... +26: No modifications detected for re-loaded extension module utils, skipping build step... +26: Loading extension module utils... + 1: No modifications detected for re-loaded extension module utils, skipping build step... + 1: Loading extension module utils... +11: No modifications detected for re-loaded extension module utils, skipping build step... +11: Loading extension module utils... +29: No modifications detected for re-loaded extension module utils, skipping build step... +29: Loading extension module utils... +27: Loading extension module utils...Loading extension module utils... +27: + 8: No modifications detected for re-loaded extension module utils, skipping build step... + 8: Loading extension module utils... +17: No modifications detected for re-loaded extension module utils, skipping build step... +17: Loading extension module utils... +26: No modifications detected for re-loaded extension module utils, skipping build step... +26: Loading extension module utils... +29: No modifications detected for re-loaded extension module utils, skipping build step... +29: Loading extension module utils... +27: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... +27: No modifications detected for re-loaded extension module utils, skipping build step... +27: Loading extension module utils... +27: Loading extension module utils... +27: +27: Loading extension module utils... +22: No modifications detected for re-loaded extension module utils, skipping build step... +22: Loading extension module utils... +29: No modifications detected for re-loaded extension module utils, skipping build step... + 3: No modifications detected for re-loaded extension module utils, skipping build step... + 3: Loading extension module utils... +11: No modifications detected for re-loaded extension module utils, skipping build step... +11: Loading extension module utils... +29: Loading extension module utils... +27: No modifications detected for re-loaded extension module utils, skipping build step... +27: Loading extension module utils... +26: No modifications detected for re-loaded extension module utils, skipping build step... +26: Loading extension module utils... +26: No modifications detected for re-loaded extension module utils, skipping build step... +26: Loading extension module utils... +27: No modifications detected for re-loaded extension module utils, skipping build step... +27: Loading extension module utils... + 3: No modifications detected for re-loaded extension module utils, skipping build step... + 3: Loading extension module utils... + 2: No modifications detected for re-loaded extension module utils, skipping build step... + 2: Loading extension module utils... +17: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... +17: +17: Loading extension module utils... +17: Loading extension module utils... +26: No modifications detected for re-loaded extension module utils, skipping build step... +26: Loading extension module utils... +15: No modifications detected for re-loaded extension module utils, skipping build step... +15: Loading extension module utils... +14: No modifications detected for re-loaded extension module utils, skipping build step... +14: Loading extension module utils... + 7: No modifications detected for re-loaded extension module utils, skipping build step... + 7: Loading extension module utils... +26: No modifications detected for re-loaded extension module utils, skipping build step... +26: Loading extension module utils... +26: No modifications detected for re-loaded extension module utils, skipping build step... +26: Loading extension module utils... +17: No modifications detected for re-loaded extension module utils, skipping build step... +17: Loading extension module utils... +24: No modifications detected for re-loaded extension module utils, skipping build step... +24: Loading extension module utils... +14: No modifications detected for re-loaded extension module utils, skipping build step... +14: Loading extension module utils... +20: No modifications detected for re-loaded extension module utils, skipping build step... +20: Loading extension module utils... +26: No modifications detected for re-loaded extension module utils, skipping build step... +26: Loading extension module utils... +18: No modifications detected for re-loaded extension module utils, skipping build step... +18: Loading extension module utils... +28: No modifications detected for re-loaded extension module utils, skipping build step... +28: Loading extension module utils... +23: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... +23: +23: Loading extension module utils...Loading extension module utils... +23: +22: No modifications detected for re-loaded extension module utils, skipping build step... +22: Loading extension module utils... + 3: No modifications detected for re-loaded extension module utils, skipping build step... + 3: Loading extension module utils... +23: No modifications detected for re-loaded extension module utils, skipping build step... +23: Loading extension module utils... +20: No modifications detected for re-loaded extension module utils, skipping build step... +20: Loading extension module utils... +17: No modifications detected for re-loaded extension module utils, skipping build step... +17: Loading extension module utils... +22: No modifications detected for re-loaded extension module utils, skipping build step... +22: Loading extension module utils... + 9: No modifications detected for re-loaded extension module utils, skipping build step... + 9: Loading extension module utils... + 5: No modifications detected for re-loaded extension module utils, skipping build step... + 5: Loading extension module utils... + 5: No modifications detected for re-loaded extension module utils, skipping build step... + 5: Loading extension module utils... + 5: No modifications detected for re-loaded extension module utils, skipping build step... + 5: Loading extension module utils... +11: No modifications detected for re-loaded extension module utils, skipping build step... +11: Loading extension module utils... +11: No modifications detected for re-loaded extension module utils, skipping build step... +11: Loading extension module utils... + 3: No modifications detected for re-loaded extension module utils, skipping build step... + 3: Loading extension module utils... + 6: No modifications detected for re-loaded extension module utils, skipping build step... + 6: Loading extension module utils... + 3: No modifications detected for re-loaded extension module utils, skipping build step... + 3: Loading extension module utils... +11: No modifications detected for re-loaded extension module utils, skipping build step... +11: Loading extension module utils... +14: No modifications detected for re-loaded extension module utils, skipping build step... +14: Loading extension module utils... +20: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... +20: +20: Loading extension module utils...Loading extension module utils... +20: +23: No modifications detected for re-loaded extension module utils, skipping build step... +23: Loading extension module utils... +19: No modifications detected for re-loaded extension module utils, skipping build step... +19: Loading extension module utils... + 9: No modifications detected for re-loaded extension module utils, skipping build step... + 9: Loading extension module utils... + 9: No modifications detected for re-loaded extension module utils, skipping build step... + 9: Loading extension module utils... + 9: No modifications detected for re-loaded extension module utils, skipping build step... + 9: Loading extension module utils... + 9: No modifications detected for re-loaded extension module utils, skipping build step... + 9: Loading extension module utils... +17: No modifications detected for re-loaded extension module utils, skipping build step... +17: Loading extension module utils... + 4: No modifications detected for re-loaded extension module utils, skipping build step... + 4: Loading extension module utils... +20: No modifications detected for re-loaded extension module utils, skipping build step... +20: Loading extension module utils... + 6: No modifications detected for re-loaded extension module utils, skipping build step... + 6: Loading extension module utils... +20: No modifications detected for re-loaded extension module utils, skipping build step... +20: Loading extension module utils... +17: No modifications detected for re-loaded extension module utils, skipping build step... +17: Loading extension module utils... +19: No modifications detected for re-loaded extension module utils, skipping build step... +19: Loading extension module utils... +19: No modifications detected for re-loaded extension module utils, skipping build step... +19: Loading extension module utils... +19: No modifications detected for re-loaded extension module utils, skipping build step... +19: Loading extension module utils... +22: No modifications detected for re-loaded extension module utils, skipping build step... +22: Loading extension module utils... +15: No modifications detected for re-loaded extension module utils, skipping build step... +15: Loading extension module utils... + 2: No modifications detected for re-loaded extension module utils, skipping build step... + 2: Loading extension module utils... +18: No modifications detected for re-loaded extension module utils, skipping build step... +18: Loading extension module utils... +31: No modifications detected for re-loaded extension module utils, skipping build step... +31: Loading extension module utils... + 6: No modifications detected for re-loaded extension module utils, skipping build step... + 6: Loading extension module utils... +17: No modifications detected for re-loaded extension module utils, skipping build step... +17: Loading extension module utils... +15: No modifications detected for re-loaded extension module utils, skipping build step... +15: Loading extension module utils... +15: No modifications detected for re-loaded extension module utils, skipping build step... +15: Loading extension module utils... +23: No modifications detected for re-loaded extension module utils, skipping build step... +23: Loading extension module utils... +15: No modifications detected for re-loaded extension module utils, skipping build step... +15: Loading extension module utils... +28: No modifications detected for re-loaded extension module utils, skipping build step... +28: Loading extension module utils... + 4: No modifications detected for re-loaded extension module utils, skipping build step... + 4: Loading extension module utils... +23: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... +23: +23: Loading extension module utils... +23: Loading extension module utils... +15: No modifications detected for re-loaded extension module utils, skipping build step... +15: Loading extension module utils... +31: No modifications detected for re-loaded extension module utils, skipping build step... +31: Loading extension module utils... +31: No modifications detected for re-loaded extension module utils, skipping build step... +31: Loading extension module utils... +23: No modifications detected for re-loaded extension module utils, skipping build step... +23: Loading extension module utils... +15: No modifications detected for re-loaded extension module utils, skipping build step... +15: Loading extension module utils... +24: No modifications detected for re-loaded extension module utils, skipping build step... +24: Loading extension module utils... +22: No modifications detected for re-loaded extension module utils, skipping build step... +22: Loading extension module utils... +22: No modifications detected for re-loaded extension module utils, skipping build step... +22: Loading extension module utils... +22: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... +22: +22: Loading extension module utils... +31: No modifications detected for re-loaded extension module utils, skipping build step... +31: Loading extension module utils... +31: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... +31: +31: Loading extension module utils... + 9: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... + 9: + 9: Loading extension module utils...Loading extension module utils... + 9: + 7: No modifications detected for re-loaded extension module utils, skipping build step... + 7: Loading extension module utils... +22: Loading extension module utils... +31: Loading extension module utils... + 9: No modifications detected for re-loaded extension module utils, skipping build step... + 9: Loading extension module utils... +20: No modifications detected for re-loaded extension module utils, skipping build step... +20: Loading extension module utils... + 2: No modifications detected for re-loaded extension module utils, skipping build step... + 2: Loading extension module utils... +31: No modifications detected for re-loaded extension module utils, skipping build step... +31: Loading extension module utils... +20: No modifications detected for re-loaded extension module utils, skipping build step... +20: Loading extension module utils... +19: No modifications detected for re-loaded extension module utils, skipping build step... +19: Loading extension module utils... +19: No modifications detected for re-loaded extension module utils, skipping build step... +19: Loading extension module utils...No modifications detected for re-loaded extension module utils, skipping build step... +19: +19: Loading extension module utils... +31: No modifications detected for re-loaded extension module utils, skipping build step... +28: No modifications detected for re-loaded extension module utils, skipping build step... +28: Loading extension module utils... + 3: No modifications detected for re-loaded extension module utils, skipping build step... + 3: Loading extension module utils... +31: Loading extension module utils... +19: No modifications detected for re-loaded extension module utils, skipping build step... +19: Loading extension module utils... +28: No modifications detected for re-loaded extension module utils, skipping build step... +28: No modifications detected for re-loaded extension module utils, skipping build step...Loading extension module utils... +28: +28: Loading extension module utils... + 3: No modifications detected for re-loaded extension module utils, skipping build step... + 3: Loading extension module utils... +24: No modifications detected for re-loaded extension module utils, skipping build step... +24: Loading extension module utils... +28: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... +28: +28: Loading extension module utils... + 3: No modifications detected for re-loaded extension module utils, skipping build step... + 3: Loading extension module utils... + 5: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... + 5: + 5: Loading extension module utils...Loading extension module utils... + 5: + 2: No modifications detected for re-loaded extension module utils, skipping build step... + 2: Loading extension module utils... + 2: No modifications detected for re-loaded extension module utils, skipping build step... + 2: Loading extension module utils... + 2: No modifications detected for re-loaded extension module utils, skipping build step... +28: Loading extension module utils... + 2: Loading extension module utils... + 6: No modifications detected for re-loaded extension module utils, skipping build step... + 6: Loading extension module utils... + 6: No modifications detected for re-loaded extension module utils, skipping build step... + 6: Loading extension module utils... + 5: No modifications detected for re-loaded extension module utils, skipping build step... + 5: Loading extension module utils...No modifications detected for re-loaded extension module utils, skipping build step... + 2: No modifications detected for re-loaded extension module utils, skipping build step... + 2: Loading extension module utils... + 5: +18: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... +18: +18: Loading extension module utils...Loading extension module utils... +18: +18: No modifications detected for re-loaded extension module utils, skipping build step... +28: No modifications detected for re-loaded extension module utils, skipping build step... +28: Loading extension module utils... + 6: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... + 5: Loading extension module utils... + 6: Loading extension module utils... + 6: + 2: No modifications detected for re-loaded extension module utils, skipping build step... + 2: Loading extension module utils... + 6: Loading extension module utils... + 6: No modifications detected for re-loaded extension module utils, skipping build step... + 6: Loading extension module utils... + 4: No modifications detected for re-loaded extension module utils, skipping build step... + 4: Loading extension module utils... + 4: No modifications detected for re-loaded extension module utils, skipping build step... + 4: Loading extension module utils... + 5: No modifications detected for re-loaded extension module utils, skipping build step... + 5: Loading extension module utils... + 7: No modifications detected for re-loaded extension module utils, skipping build step... + 7: Loading extension module utils... + 7: No modifications detected for re-loaded extension module utils, skipping build step... + 7: Loading extension module utils... + 4: No modifications detected for re-loaded extension module utils, skipping build step... + 4: Loading extension module utils... +24: No modifications detected for re-loaded extension module utils, skipping build step... +24: Loading extension module utils... +24: No modifications detected for re-loaded extension module utils, skipping build step... +24: Loading extension module utils... +24: No modifications detected for re-loaded extension module utils, skipping build step... +24: Loading extension module utils... + 4: No modifications detected for re-loaded extension module utils, skipping build step...No modifications detected for re-loaded extension module utils, skipping build step... + 4: + 4: Loading extension module utils... + 4: Loading extension module utils... + 4: No modifications detected for re-loaded extension module utils, skipping build step... + 4: Loading extension module utils... + 7: No modifications detected for re-loaded extension module utils, skipping build step... + 7: Loading extension module utils... + 7: No modifications detected for re-loaded extension module utils, skipping build step... +24: No modifications detected for re-loaded extension module utils, skipping build step... +24: Loading extension module utils... +18: Loading extension module utils... + 7: No modifications detected for re-loaded extension module utils, skipping build step...Loading extension module utils... + 7: + 7: Loading extension module utils...No modifications detected for re-loaded extension module utils, skipping build step... + 7: +18: No modifications detected for re-loaded extension module utils, skipping build step... + 7: Loading extension module utils... +18: Loading extension module utils... +24: No modifications detected for re-loaded extension module utils, skipping build step... +24: Loading extension module utils... +18: No modifications detected for re-loaded extension module utils, skipping build step... +18: Loading extension module utils... +18: No modifications detected for re-loaded extension module utils, skipping build step... +18: Loading extension module utils... + 0: Using /pfs/lustrep4/users/muennighoff/.cache/torch_extensions/py39_cpu as PyTorch extensions root... + 0: No modifications detected for re-loaded extension module utils, skipping build step... + 0: Loading extension module utils... + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/utils.py:349: UserWarning: Parameter count with the embeddings will be inaccurate with PP > 1, as the first and last stage hold several copies of the embeddings + 0: warnings.warn("Parameter count with the embeddings will be inaccurate with PP > 1, as the first and last stage hold several copies of the embeddings") diff --git a/2b855b4bc4opt2/3509629.out b/2b855b4bc4opt2/3509629.out new file mode 100644 index 0000000000000000000000000000000000000000..13354bf6731eb178a7da5b76241e7a4625224b4c --- /dev/null +++ b/2b855b4bc4opt2/3509629.out @@ -0,0 +1,34358 @@ +Model parameters: d_model 2304 ffw_size 9216 kv_size 128 n_heads 18 n_layers 28 +Megatron-DeepSpeed/pretrain_gpt.py --tensor-model-parallel-size 1 --pipeline-model-parallel-size 1 --num-layers 28 --hidden-size 2304 --num-attention-heads 18 --kv-channels 128 --ffn-hidden-size 9216 --seq-length 2048 --max-position-embeddings 2048 --micro-batch-size 2 --global-batch-size 512 --train-samples 1 --vocab-file gpt2/vocab.json --merge-file gpt2/merges.txt --clip-grad 1.0 --kill-switch-path kill-switch-2b855b4bc4opt3val --bf16 --optimizer adam --adam-beta1 0.9 --adam-beta2 0.999 --adam-eps 1e-8 --lr 2e-4 --min-lr 2e-5 --lr-decay-style cosine --lr-decay-samples 1 --lr-warmup-samples 0 --clip-grad 1.0 --weight-decay 1e-1 --override-lr-scheduler --reset-progress --no-load-optim --log-interval 10 --save-interval 1000 --eval-interval 1 --eval-iters 100 --eval-only true --tensorboard-dir tensorboard_2b855b4bc4opt3val --tensorboard-queue-size 5 --log-timers-to-tensorboard --log-batch-size-to-tensorboard --log-validation-ppl-to-tensorboard --save lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3 --load lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3 --train-weighted-split-paths-path train1b5.txt --valid-weighted-split-paths-path val.txt --data-impl mmap --deepspeed --deepspeed_config ds_configs/3509629.json --zero-stage 0 +START 3509629: Sat 13 May 2023 12:56:11 AM EEST + 0: + 0: + 0: ======================= ROCm System Management Interface ======================= + 0: ================================= Concise Info ================================= + 0: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 0: 0 48.0c 98.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 1 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 2 40.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 4 46.0c 99.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 5 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 6 37.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: ================================================================================ + 0: ============================= End of ROCm SMI Log ============================== + 1: + 1: + 1: ======================= ROCm System Management Interface ======================= + 1: ================================= Concise Info ================================= + 1: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 1: 0 48.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 2 39.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 4 47.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 6 37.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: ================================================================================ + 1: ============================= End of ROCm SMI Log ============================== + 5: + 5: + 5: ======================= ROCm System Management Interface ======================= + 5: ================================= Concise Info ================================= + 5: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 5: 0 50.0c 98.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 1 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 2 41.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 4 46.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 6 46.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: ================================================================================ + 5: ============================= End of ROCm SMI Log ============================== + 3: + 3: + 3: ======================= ROCm System Management Interface ======================= + 3: ================================= Concise Info ================================= + 3: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 3: 0 51.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 2 41.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 4 43.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 6 44.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: ================================================================================ + 3: ============================= End of ROCm SMI Log ============================== +13: +13: +13: ======================= ROCm System Management Interface ======================= +13: ================================= Concise Info ================================= +13: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +13: 0 46.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 1 52.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 2 45.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 4 48.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 5 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 6 41.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: ================================================================================ +13: ============================= End of ROCm SMI Log ============================== + 8: + 8: + 8: ======================= ROCm System Management Interface ======================= + 8: ================================= Concise Info ================================= + 8: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 8: 0 45.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 2 48.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 4 44.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 6 36.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 7 53.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: ================================================================================ + 8: ============================= End of ROCm SMI Log ============================== +15: +15: +15: ======================= ROCm System Management Interface ======================= +15: ================================= Concise Info ================================= +15: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +15: 0 54.0c 98.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 2 41.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 4 43.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 5 53.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 6 44.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 7 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: ================================================================================ +15: ============================= End of ROCm SMI Log ============================== +26: +26: +26: ======================= ROCm System Management Interface ======================= +26: ================================= Concise Info ================================= +26: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +26: 0 40.0c 100.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 2 41.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 3 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 4 49.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 6 44.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 7 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: ================================================================================ +26: ============================= End of ROCm SMI Log ============================== +24: +24: +24: ======================= ROCm System Management Interface ======================= +24: ================================= Concise Info ================================= +24: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +24: 0 48.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 2 44.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 4 47.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 6 42.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: ================================================================================ +24: ============================= End of ROCm SMI Log ============================== + 7: + 7: + 7: ======================= ROCm System Management Interface ======================= + 7: ================================= Concise Info ================================= + 7: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 7: 0 41.0c 98.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 2 45.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 4 42.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 5 52.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 6 45.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: ================================================================================ + 7: ============================= End of ROCm SMI Log ============================== +30: +30: +30: ======================= ROCm System Management Interface ======================= +30: ================================= Concise Info ================================= +30: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +30: 0 47.0c 98.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 2 42.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 4 47.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 6 46.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: ================================================================================ +30: ============================= End of ROCm SMI Log ============================== +16: +16: +16: ======================= ROCm System Management Interface ======================= +16: ================================= Concise Info ================================= +16: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +16: 0 45.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 1 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 2 38.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 4 45.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 6 43.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: ================================================================================ +16: ============================= End of ROCm SMI Log ============================== + 2: + 2: + 2: ======================= ROCm System Management Interface ======================= + 2: ================================= Concise Info ================================= + 2: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 2: 0 47.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 1 52.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 2 42.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 4 50.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 5 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 6 47.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: ================================================================================ + 2: ============================= End of ROCm SMI Log ============================== + 4: + 4: + 4: ======================= ROCm System Management Interface ======================= + 4: ================================= Concise Info ================================= + 4: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 4: 0 45.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 2 46.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 4 45.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 6 41.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: ================================================================================ + 4: ============================= End of ROCm SMI Log ============================== +11: +11: +11: ======================= ROCm System Management Interface ======================= +11: ================================= Concise Info ================================= +11: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +11: 0 48.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 2 44.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 4 43.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 6 44.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: ================================================================================ +11: ============================= End of ROCm SMI Log ============================== +18: +18: +18: ======================= ROCm System Management Interface ======================= +18: ================================= Concise Info ================================= +18: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +18: 0 47.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 2 43.0c 99.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 4 41.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 6 43.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 7 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: ================================================================================ +18: ============================= End of ROCm SMI Log ============================== +10: +10: +10: ======================= ROCm System Management Interface ======================= +10: ================================= Concise Info ================================= +10: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +10: 0 50.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 1 54.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 2 41.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 3 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 4 45.0c 79.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 6 38.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: ================================================================================ +10: ============================= End of ROCm SMI Log ============================== +29: +29: +29: ======================= ROCm System Management Interface ======================= +29: ================================= Concise Info ================================= +29: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +29: 0 48.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 2 41.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 4 45.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 5 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 6 38.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: ================================================================================ +29: ============================= End of ROCm SMI Log ============================== +21: +21: +21: ======================= ROCm System Management Interface ======================= +21: ================================= Concise Info ================================= +21: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +21: 0 48.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 2 45.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 4 49.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 6 48.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: ================================================================================ +21: ============================= End of ROCm SMI Log ============================== +22: +22: +22: ======================= ROCm System Management Interface ======================= +22: ================================= Concise Info ================================= +22: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +22: 0 43.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 2 40.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 4 46.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 5 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 6 43.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: ================================================================================ +22: ============================= End of ROCm SMI Log ============================== +14: +14: +14: ======================= ROCm System Management Interface ======================= +14: ================================= Concise Info ================================= +14: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +14: 0 52.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 2 45.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 4 44.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 5 54.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 6 46.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: ================================================================================ +14: ============================= End of ROCm SMI Log ============================== +28: +28: +28: ======================= ROCm System Management Interface ======================= +28: ================================= Concise Info ================================= +28: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +28: 0 50.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 1 54.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 2 45.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 4 43.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 6 43.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: ================================================================================ +28: ============================= End of ROCm SMI Log ============================== +23: +23: +23: ======================= ROCm System Management Interface ======================= +23: ================================= Concise Info ================================= +23: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +23: 0 45.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 2 45.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 4 43.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 6 43.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 7 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: ================================================================================ +23: ============================= End of ROCm SMI Log ============================== +19: +19: +19: ======================= ROCm System Management Interface ======================= +19: ================================= Concise Info ================================= +19: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +19: 0 49.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 1 54.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 2 42.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 4 44.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 6 44.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: ================================================================================ +19: ============================= End of ROCm SMI Log ============================== +12: +12: +12: ======================= ROCm System Management Interface ======================= +12: ================================= Concise Info ================================= +12: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +12: 0 48.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 2 46.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 4 41.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 5 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 6 41.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: ================================================================================ +12: ============================= End of ROCm SMI Log ============================== +31: +31: +31: ======================= ROCm System Management Interface ======================= +31: ================================= Concise Info ================================= +31: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +31: 0 47.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 1 52.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 2 43.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 4 43.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 6 42.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: ================================================================================ +31: ============================= End of ROCm SMI Log ============================== +25: +25: +25: ======================= ROCm System Management Interface ======================= +25: ================================= Concise Info ================================= +25: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +25: 0 48.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 2 48.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 4 43.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 5 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 6 47.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: ================================================================================ +25: ============================= End of ROCm SMI Log ============================== + 6: + 6: + 6: ======================= ROCm System Management Interface ======================= + 6: ================================= Concise Info ================================= + 6: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 6: 0 52.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 1 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 2 44.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 3 40.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 4 51.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 6 39.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 7 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: ================================================================================ + 6: ============================= End of ROCm SMI Log ============================== +20: +20: +20: ======================= ROCm System Management Interface ======================= +20: ================================= Concise Info ================================= +20: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +20: 0 50.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 1 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 2 49.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 3 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 4 40.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 6 37.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: ================================================================================ +20: ============================= End of ROCm SMI Log ============================== +27: +27: +27: ======================= ROCm System Management Interface ======================= +27: ================================= Concise Info ================================= +27: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +27: 0 48.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 2 44.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 4 46.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 6 43.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: ================================================================================ +27: ============================= End of ROCm SMI Log ============================== +17: +17: +17: ======================= ROCm System Management Interface ======================= +17: ================================= Concise Info ================================= +17: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +17: 0 46.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 2 40.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 3 40.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 4 40.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 6 40.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 7 52.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: ================================================================================ +17: ============================= End of ROCm SMI Log ============================== + 9: + 9: + 9: ======================= ROCm System Management Interface ======================= + 9: ================================= Concise Info ================================= + 9: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 9: 0 45.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 2 35.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 4 45.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 5 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 6 45.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: ================================================================================ + 9: ============================= End of ROCm SMI Log ============================== +11: Launching on nid006114 (11/32), master nid005249 port 9999, GPUs 8, CUDA: True + 3: Launching on nid005448 (3/32), master nid005249 port 9999, GPUs 8, CUDA: True + 8: Launching on nid005788 (8/32), master nid005249 port 9999, GPUs 8, CUDA: True + 5: Launching on nid005533 (5/32), master nid005249 port 9999, GPUs 8, CUDA: True + 7: Launching on nid005714 (7/32), master nid005249 port 9999, GPUs 8, CUDA: True + 0: Launching on nid005249 (0/32), master nid005249 port 9999, GPUs 8, CUDA: True +30: Launching on nid007238 (30/32), master nid005249 port 9999, GPUs 8, CUDA: True +24: Launching on nid006850 (24/32), master nid005249 port 9999, GPUs 8, CUDA: True +29: Launching on nid007194 (29/32), master nid005249 port 9999, GPUs 8, CUDA: True + 2: Launching on nid005389 (2/32), master nid005249 port 9999, GPUs 8, CUDA: True +28: Launching on nid007193 (28/32), master nid005249 port 9999, GPUs 8, CUDA: True +15: Launching on nid006519 (15/32), master nid005249 port 9999, GPUs 8, CUDA: True +10: Launching on nid005908 (10/32), master nid005249 port 9999, GPUs 8, CUDA: True +26: Launching on nid006979 (26/32), master nid005249 port 9999, GPUs 8, CUDA: True +14: Launching on nid006437 (14/32), master nid005249 port 9999, GPUs 8, CUDA: True +22: Launching on nid006694 (22/32), master nid005249 port 9999, GPUs 8, CUDA: True + 4: Launching on nid005521 (4/32), master nid005249 port 9999, GPUs 8, CUDA: True +19: Launching on nid006676 (19/32), master nid005249 port 9999, GPUs 8, CUDA: True +16: Launching on nid006534 (16/32), master nid005249 port 9999, GPUs 8, CUDA: True + 1: Launching on nid005299 (1/32), master nid005249 port 9999, GPUs 8, CUDA: True +13: Launching on nid006219 (13/32), master nid005249 port 9999, GPUs 8, CUDA: True +18: Launching on nid006601 (18/32), master nid005249 port 9999, GPUs 8, CUDA: True +23: Launching on nid006770 (23/32), master nid005249 port 9999, GPUs 8, CUDA: True +21: Launching on nid006693 (21/32), master nid005249 port 9999, GPUs 8, CUDA: True +17: Launching on nid006600 (17/32), master nid005249 port 9999, GPUs 8, CUDA: True +31: Launching on nid007239 (31/32), master nid005249 port 9999, GPUs 8, CUDA: True +25: Launching on nid006851 (25/32), master nid005249 port 9999, GPUs 8, CUDA: True + 9: Launching on nid005888 (9/32), master nid005249 port 9999, GPUs 8, CUDA: True + 6: Launching on nid005609 (6/32), master nid005249 port 9999, GPUs 8, CUDA: True +27: Launching on nid007068 (27/32), master nid005249 port 9999, GPUs 8, CUDA: True +20: Launching on nid006677 (20/32), master nid005249 port 9999, GPUs 8, CUDA: True +12: Launching on nid006218 (12/32), master nid005249 port 9999, GPUs 8, CUDA: True + 0: using world size: 256, data-parallel-size: 256, tensor-model-parallel size: 1, pipeline-model-parallel size: 1 + 0: accumulate and all-reduce gradients in fp32 for bfloat16 data type. + 0: using torch.bfloat16 for parameters ... + 0: ------------------------ arguments ------------------------ + 0: abort_on_unmet_fused_kernel_constraints ......... False + 0: accumulate_allreduce_grads_in_fp32 .............. True + 0: adam_beta1 ...................................... 0.9 + 0: adam_beta2 ...................................... 0.999 + 0: adam_eps ........................................ 1e-08 + 0: adlr_autoresume ................................. False + 0: adlr_autoresume_interval ........................ 1000 + 0: apply_query_key_layer_scaling ................... True + 0: apply_residual_connection_post_layernorm ........ False + 0: attention_dropout ............................... 0.1 + 0: attention_softmax_in_fp32 ....................... False + 0: bert_binary_head ................................ True + 0: bert_load ....................................... None + 0: bf16 ............................................ True + 0: bias_dropout_fusion ............................. True + 0: bias_gelu_fusion ................................ True + 0: biencoder_projection_dim ........................ 0 + 0: biencoder_shared_query_context_model ............ False + 0: block_data_path ................................. None + 0: checkpoint_activations .......................... False + 0: checkpoint_in_cpu ............................... False + 0: checkpoint_num_layers ........................... 1 + 0: clip_grad ....................................... 1.0 + 0: codecarbon_dir .................................. None + 0: consumed_train_samples .......................... 0 + 0: consumed_train_tokens ........................... 0 + 0: consumed_valid_samples .......................... 0 + 0: contigious_checkpointing ........................ False + 0: cpu_optimizer ................................... False + 0: cpu_torch_adam .................................. False + 0: curriculum_learning ............................. False + 0: data_impl ....................................... mmap + 0: data_parallel_size .............................. 256 + 0: data_path ....................................... None + 0: dataloader_type ................................. single + 0: DDP_impl ........................................ local + 0: decoder_seq_length .............................. None + 0: deepscale ....................................... False + 0: deepscale_config ................................ None + 0: deepspeed ....................................... True + 0: deepspeed_activation_checkpointing .............. False + 0: deepspeed_config ................................ ds_configs/3509629.json + 0: deepspeed_mpi ................................... False + 0: distribute_checkpointed_activations ............. False + 0: distributed_backend ............................. nccl + 0: embed_layernorm ................................. False + 0: embedding_path .................................. None + 0: encoder_seq_length .............................. 2048 + 0: eod_mask_loss ................................... False + 0: eval_interval ................................... 1 + 0: eval_iters ...................................... 100 + 0: eval_only ....................................... True + 0: evidence_data_path .............................. None + 0: exit_duration_in_mins ........................... None + 0: exit_interval ................................... None + 0: ffn_hidden_size ................................. 9216 + 0: finetune ........................................ False + 0: fp16 ............................................ False + 0: fp16_lm_cross_entropy ........................... False + 0: fp32_residual_connection ........................ False + 0: gigaflos_no_embeds .............................. 0 + 0: global_batch_size ............................... 512 + 0: glu_activation .................................. None + 0: hidden_dropout .................................. 0.1 + 0: hidden_size ..................................... 2304 + 0: hysteresis ...................................... 2 + 0: ict_head_size ................................... None + 0: ict_load ........................................ None + 0: img_dim ......................................... 224 + 0: indexer_batch_size .............................. 128 + 0: indexer_log_interval ............................ 1000 + 0: inference ....................................... False + 0: init_method_std ................................. 0.02 + 0: init_method_xavier_uniform ...................... False + 0: initial_loss_scale .............................. 4294967296 + 0: kill_switch_path ................................ kill-switch-2b855b4bc4opt3val + 0: kv_channels ..................................... 128 + 0: layer_norm_fusion ............................... True + 0: layernorm_epsilon ............................... 1e-05 + 0: lazy_mpu_init ................................... None + 0: load ............................................ lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3 + 0: local_rank ...................................... None + 0: log_batch_size_to_tensorboard ................... True + 0: log_interval .................................... 10 + 0: log_learning_rate_to_tensorboard ................ True + 0: log_level ....................................... None + 0: log_level_replica ............................... None + 0: log_loss_scale_to_tensorboard ................... True + 0: log_num_zeros_in_grad ........................... False + 0: log_params_norm ................................. False + 0: log_path ........................................ None + 0: log_timers_to_tensorboard ....................... True + 0: log_validation_ppl_to_tensorboard ............... True + 0: loss_on_targets_only ............................ False + 0: loss_scale ...................................... None + 0: loss_scale_window ............................... 1000 + 0: lr .............................................. 0.0002 + 0: lr_decay_iters .................................. None + 0: lr_decay_samples ................................ 1 + 0: lr_decay_style .................................. cosine + 0: lr_decay_tokens ................................. None + 0: lr_warmup_fraction .............................. None + 0: lr_warmup_iters ................................. 0 + 0: lr_warmup_samples ............................... 0 + 0: make_vocab_size_divisible_by .................... 128 + 0: mask_prob ....................................... 0.15 + 0: masked_softmax_fusion ........................... True + 0: max_position_embeddings ......................... 2048 + 0: mean_noise_span_length .......................... None + 0: memory_centric_tiled_linear ..................... False + 0: merge_file ...................................... gpt2/merges.txt + 0: micro_batch_size ................................ 2 + 0: min_loss_scale .................................. 1.0 + 0: min_lr .......................................... 2e-05 + 0: mmap_warmup ..................................... False + 0: no_load_optim ................................... True + 0: no_load_rng ..................................... None + 0: no_save_optim ................................... None + 0: no_save_rng ..................................... None + 0: noise_density ................................... None + 0: num_attention_heads ............................. 18 + 0: num_channels .................................... 3 + 0: num_classes ..................................... 1000 + 0: num_layers ...................................... 28 + 0: num_layers_per_virtual_pipeline_stage ........... None + 0: num_workers ..................................... 2 + 0: onnx_safe ....................................... None + 0: openai_gelu ..................................... False + 0: optimizer ....................................... adam + 0: optimizer_fusion ................................ True + 0: override_lr_scheduler ........................... True + 0: pad_vocab_size_to ............................... None + 0: params_dtype .................................... torch.bfloat16 + 0: partition_activations ........................... False + 0: patch_dim ....................................... 16 + 0: pipeline_model_parallel_size .................... 1 + 0: position_embedding_type ......................... PositionEmbeddingType.absolute + 0: pp_partition_method ............................. None + 0: profile_backward ................................ False + 0: query_in_block_prob ............................. 0.1 + 0: rampup_batch_size ............................... None + 0: rank ............................................ 0 + 0: remote_device ................................... none + 0: reset_attention_mask ............................ False + 0: reset_position_ids .............................. False + 0: reset_progress .................................. True + 0: retriever_report_topk_accuracies ................ [] + 0: retriever_score_scaling ......................... False + 0: retriever_seq_length ............................ 256 + 0: reweight_loss_based_on_position_frequency ....... False + 0: sample_rate ..................................... 1.0 + 0: save ............................................ lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3 + 0: save_interval ................................... 1000 + 0: scatter_gather_tensors_in_pipeline .............. True + 0: scattered_embeddings ............................ False + 0: seed ............................................ 1234 + 0: seq_length ...................................... 2048 + 0: sgd_momentum .................................... 0.9 + 0: short_seq_prob .................................. 0.1 + 0: skip_train_iteration_range ...................... None + 0: split ........................................... None + 0: split_transformers .............................. False + 0: sync_tp_duplicated_parameters ................... False + 0: synchronize_each_layer .......................... False + 0: tensor_model_parallel_size ...................... 1 + 0: tensorboard_dir ................................. tensorboard_2b855b4bc4opt3val + 0: tensorboard_log_interval ........................ 1 + 0: tensorboard_queue_size .......................... 5 + 0: test_weighted_split_paths ....................... None + 0: test_weighted_split_paths_path .................. None + 0: tile_factor ..................................... 1 + 0: titles_data_path ................................ None + 0: tokenizer_name_or_path .......................... None + 0: tokenizer_type .................................. GPT2BPETokenizer + 0: train_iters ..................................... None + 0: train_samples ................................... 1 + 0: train_tokens .................................... None + 0: train_weighted_split_names ...................... ['train'] + 0: train_weighted_split_paths ...................... [['/scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_1B5_text_document']] + 0: train_weighted_split_paths_path ................. None + 0: train_weighted_split_splits ..................... [['0:1']] + 0: train_weighted_split_weights .................... [['1.0']] + 0: universal_checkpoint ............................ False + 0: use_bnb_optimizer ............................... False + 0: use_checkpoint_lr_scheduler ..................... False + 0: use_contiguous_buffers_in_ddp ................... True + 0: use_cpu_initialization .......................... None + 0: use_one_sent_docs ............................... False + 0: use_pin_memory .................................. False + 0: valid_num_workers ............................... 2 + 0: valid_weighted_split_names ...................... ['validation'] + 0: valid_weighted_split_paths ...................... [['/scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document']] + 0: valid_weighted_split_paths_path ................. None + 0: valid_weighted_split_splits ..................... [['0:1']] + 0: valid_weighted_split_weights .................... [['1.0']] + 0: virtual_pipeline_model_parallel_size ............ None + 0: vocab_extra_ids ................................. 0 + 0: vocab_file ...................................... gpt2/vocab.json + 0: weight_decay .................................... 0.1 + 0: world_size ...................................... 256 + 0: zero_allgather_bucket_size ...................... 0.0 + 0: zero_contigious_gradients ....................... False + 0: zero_reduce_bucket_size ......................... 0.0 + 0: zero_reduce_scatter ............................. False + 0: zero_stage ...................................... 0 + 0: -------------------- end of arguments --------------------- + 0: setting number of micro-batches to constant 1 + 0: > building GPT2BPETokenizer tokenizer ... + 0: > padded vocab (size: 50257) with 47 dummy tokens (new size: 50304) + 0: DeepSpeed general environment info: + 0: torch install path ............... ['/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch'] + 0: torch version .................... 1.13.0+rocm5.2 + 0: torch cuda version ............... None + 0: torch hip version ................ 5.2.21151-afdc89f8 + 0: nvcc version ..................... None + 0: deepspeed install path ........... ['/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/deepspeed'] + 0: deepspeed info ................... 0.7.5, unknown, unknown + 0: deepspeed wheel compiled w. ...... torch 1.13, hip 5.1 +31: > setting tensorboard ... + 0: **** Git info for Megatron: git_hash=unknown git_branch=unknown **** + 0: > initializing torch distributed ... + 0: [2023-05-13 00:58:45,842] [INFO] [comm.py:633:init_distributed] Initializing TorchBackend in DeepSpeed with backend nccl + 0: > initializing tensor model parallel with size 1 + 0: > initializing pipeline model parallel with size 1 + 0: > setting random seeds to 1234 ... + 0: > initializing model parallel cuda seeds on global rank 0, model parallel rank 0, and data parallel rank 0 with model parallel seed: 3952 and data parallel seed: 1234 + 0: > compiling dataset index builder ... + 0: make: Entering directory '/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/data' + 0: make: Nothing to be done for 'default'. + 0: make: Leaving directory '/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/data' + 0: >>> done with dataset index builder. Compilation time: 0.091 seconds + 0: > compiling and loading fused kernels ... + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.cpp -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.cpp [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_cuda.cu -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.hip [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: Total number of unsupported CUDA function calls: 0 + 0: + 0: + 0: Total number of replaced kernel launches: 87 + 0: ninja: no work to do. + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.cpp -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.cpp [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_cuda.cu -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.hip [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: Total number of unsupported CUDA function calls: 0 + 0: + 0: + 0: Total number of replaced kernel launches: 63 + 0: ninja: no work to do. + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda.cpp -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda.cpp [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda_kernel.cu -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_hip_kernel.hip [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: Total number of unsupported CUDA function calls: 0 + 0: + 0: + 0: Total number of replaced kernel launches: 67 + 0: [1/1] c++ layer_norm_hip_kernel.cuda.o layer_norm_cuda.o -shared -L/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/lib -lc10 -lc10_hip -ltorch_cpu -ltorch_hip -ltorch -ltorch_python -L/opt/rocm/lib -lamdhip64 -o fused_mix_prec_layer_norm_cuda.so + 0: >>> done with compiling and loading fused kernels. Compilation time: 31.212 seconds + 0: time to initialize megatron (seconds): 64.132 + 0: [after megatron is initialized] datetime: 2023-05-13 00:59:28 + 0: building GPT model ... + 0: [2023-05-13 00:59:28,279] [INFO] [utils.py:827:see_memory_usage] Before Building Model + 0: [2023-05-13 00:59:28,280] [INFO] [utils.py:828:see_memory_usage] MA 0.0 GB Max_MA 0.0 GB CA 0.0 GB Max_CA 0 GB + 0: [2023-05-13 00:59:28,280] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 37.17 GB, percent = 7.4% + 0: SEED_LAYERS=False BASE_SEED=1234 SEED_FN=None + 0: Using topology: {ProcessCoord(pipe=0, data=0, model=0): 0, ProcessCoord(pipe=0, data=1, model=0): 1, ProcessCoord(pipe=0, data=2, model=0): 2, ProcessCoord(pipe=0, data=3, model=0): 3, ProcessCoord(pipe=0, data=4, model=0): 4, ProcessCoord(pipe=0, data=5, model=0): 5, ProcessCoord(pipe=0, data=6, model=0): 6, ProcessCoord(pipe=0, data=7, model=0): 7, ProcessCoord(pipe=0, data=8, model=0): 8, ProcessCoord(pipe=0, data=9, model=0): 9, ProcessCoord(pipe=0, data=10, model=0): 10, ProcessCoord(pipe=0, data=11, model=0): 11, ProcessCoord(pipe=0, data=12, model=0): 12, ProcessCoord(pipe=0, data=13, model=0): 13, ProcessCoord(pipe=0, data=14, model=0): 14, ProcessCoord(pipe=0, data=15, model=0): 15, ProcessCoord(pipe=0, data=16, model=0): 16, ProcessCoord(pipe=0, data=17, model=0): 17, ProcessCoord(pipe=0, data=18, model=0): 18, ProcessCoord(pipe=0, data=19, model=0): 19, ProcessCoord(pipe=0, data=20, model=0): 20, ProcessCoord(pipe=0, data=21, model=0): 21, ProcessCoord(pipe=0, data=22, model=0): 22, ProcessCoord(pi + 0: pe=0, data=23, model=0): 23, ProcessCoord(pipe=0, data=24, model=0): 24, ProcessCoord(pipe=0, data=25, model=0): 25, ProcessCoord(pipe=0, data=26, model=0): 26, ProcessCoord(pipe=0, data=27, model=0): 27, ProcessCoord(pipe=0, data=28, model=0): 28, ProcessCoord(pipe=0, data=29, model=0): 29, ProcessCoord(pipe=0, data=30, model=0): 30, ProcessCoord(pipe=0, data=31, model=0): 31, ProcessCoord(pipe=0, data=32, model=0): 32, ProcessCoord(pipe=0, data=33, model=0): 33, ProcessCoord(pipe=0, data=34, model=0): 34, ProcessCoord(pipe=0, data=35, model=0): 35, ProcessCoord(pipe=0, data=36, model=0): 36, ProcessCoord(pipe=0, data=37, model=0): 37, ProcessCoord(pipe=0, data=38, model=0): 38, ProcessCoord(pipe=0, data=39, model=0): 39, ProcessCoord(pipe=0, data=40, model=0): 40, ProcessCoord(pipe=0, data=41, model=0): 41, ProcessCoord(pipe=0, data=42, model=0): 42, ProcessCoord(pipe=0, data=43, model=0): 43, ProcessCoord(pipe=0, data=44, model=0): 44, ProcessCoord(pipe=0, data=45, model=0): 45, ProcessCoord(pipe=0, data=4 + 0: 6, model=0): 46, ProcessCoord(pipe=0, data=47, model=0): 47, ProcessCoord(pipe=0, data=48, model=0): 48, ProcessCoord(pipe=0, data=49, model=0): 49, ProcessCoord(pipe=0, data=50, model=0): 50, ProcessCoord(pipe=0, data=51, model=0): 51, ProcessCoord(pipe=0, data=52, model=0): 52, ProcessCoord(pipe=0, data=53, model=0): 53, ProcessCoord(pipe=0, data=54, model=0): 54, ProcessCoord(pipe=0, data=55, model=0): 55, ProcessCoord(pipe=0, data=56, model=0): 56, ProcessCoord(pipe=0, data=57, model=0): 57, ProcessCoord(pipe=0, data=58, model=0): 58, ProcessCoord(pipe=0, data=59, model=0): 59, ProcessCoord(pipe=0, data=60, model=0): 60, ProcessCoord(pipe=0, data=61, model=0): 61, ProcessCoord(pipe=0, data=62, model=0): 62, ProcessCoord(pipe=0, data=63, model=0): 63, ProcessCoord(pipe=0, data=64, model=0): 64, ProcessCoord(pipe=0, data=65, model=0): 65, ProcessCoord(pipe=0, data=66, model=0): 66, ProcessCoord(pipe=0, data=67, model=0): 67, ProcessCoord(pipe=0, data=68, model=0): 68, ProcessCoord(pipe=0, data=69, model=0): + 0: 69, ProcessCoord(pipe=0, data=70, model=0): 70, ProcessCoord(pipe=0, data=71, model=0): 71, ProcessCoord(pipe=0, data=72, model=0): 72, ProcessCoord(pipe=0, data=73, model=0): 73, ProcessCoord(pipe=0, data=74, model=0): 74, ProcessCoord(pipe=0, data=75, model=0): 75, ProcessCoord(pipe=0, data=76, model=0): 76, ProcessCoord(pipe=0, data=77, model=0): 77, ProcessCoord(pipe=0, data=78, model=0): 78, ProcessCoord(pipe=0, data=79, model=0): 79, ProcessCoord(pipe=0, data=80, model=0): 80, ProcessCoord(pipe=0, data=81, model=0): 81, ProcessCoord(pipe=0, data=82, model=0): 82, ProcessCoord(pipe=0, data=83, model=0): 83, ProcessCoord(pipe=0, data=84, model=0): 84, ProcessCoord(pipe=0, data=85, model=0): 85, ProcessCoord(pipe=0, data=86, model=0): 86, ProcessCoord(pipe=0, data=87, model=0): 87, ProcessCoord(pipe=0, data=88, model=0): 88, ProcessCoord(pipe=0, data=89, model=0): 89, ProcessCoord(pipe=0, data=90, model=0): 90, ProcessCoord(pipe=0, data=91, model=0): 91, ProcessCoord(pipe=0, data=92, model=0): 92, Process + 0: Coord(pipe=0, data=93, model=0): 93, ProcessCoord(pipe=0, data=94, model=0): 94, ProcessCoord(pipe=0, data=95, model=0): 95, ProcessCoord(pipe=0, data=96, model=0): 96, ProcessCoord(pipe=0, data=97, model=0): 97, ProcessCoord(pipe=0, data=98, model=0): 98, ProcessCoord(pipe=0, data=99, model=0): 99, ProcessCoord(pipe=0, data=100, model=0): 100, ProcessCoord(pipe=0, data=101, model=0): 101, ProcessCoord(pipe=0, data=102, model=0): 102, ProcessCoord(pipe=0, data=103, model=0): 103, ProcessCoord(pipe=0, data=104, model=0): 104, ProcessCoord(pipe=0, data=105, model=0): 105, ProcessCoord(pipe=0, data=106, model=0): 106, ProcessCoord(pipe=0, data=107, model=0): 107, ProcessCoord(pipe=0, data=108, model=0): 108, ProcessCoord(pipe=0, data=109, model=0): 109, ProcessCoord(pipe=0, data=110, model=0): 110, ProcessCoord(pipe=0, data=111, model=0): 111, ProcessCoord(pipe=0, data=112, model=0): 112, ProcessCoord(pipe=0, data=113, model=0): 113, ProcessCoord(pipe=0, data=114, model=0): 114, ProcessCoord(pipe=0, data=115, mo + 0: del=0): 115, ProcessCoord(pipe=0, data=116, model=0): 116, ProcessCoord(pipe=0, data=117, model=0): 117, ProcessCoord(pipe=0, data=118, model=0): 118, ProcessCoord(pipe=0, data=119, model=0): 119, ProcessCoord(pipe=0, data=120, model=0): 120, ProcessCoord(pipe=0, data=121, model=0): 121, ProcessCoord(pipe=0, data=122, model=0): 122, ProcessCoord(pipe=0, data=123, model=0): 123, ProcessCoord(pipe=0, data=124, model=0): 124, ProcessCoord(pipe=0, data=125, model=0): 125, ProcessCoord(pipe=0, data=126, model=0): 126, ProcessCoord(pipe=0, data=127, model=0): 127, ProcessCoord(pipe=0, data=128, model=0): 128, ProcessCoord(pipe=0, data=129, model=0): 129, ProcessCoord(pipe=0, data=130, model=0): 130, ProcessCoord(pipe=0, data=131, model=0): 131, ProcessCoord(pipe=0, data=132, model=0): 132, ProcessCoord(pipe=0, data=133, model=0): 133, ProcessCoord(pipe=0, data=134, model=0): 134, ProcessCoord(pipe=0, data=135, model=0): 135, ProcessCoord(pipe=0, data=136, model=0): 136, ProcessCoord(pipe=0, data=137, model=0): 137, + 0: ProcessCoord(pipe=0, data=138, model=0): 138, ProcessCoord(pipe=0, data=139, model=0): 139, ProcessCoord(pipe=0, data=140, model=0): 140, ProcessCoord(pipe=0, data=141, model=0): 141, ProcessCoord(pipe=0, data=142, model=0): 142, ProcessCoord(pipe=0, data=143, model=0): 143, ProcessCoord(pipe=0, data=144, model=0): 144, ProcessCoord(pipe=0, data=145, model=0): 145, ProcessCoord(pipe=0, data=146, model=0): 146, ProcessCoord(pipe=0, data=147, model=0): 147, ProcessCoord(pipe=0, data=148, model=0): 148, ProcessCoord(pipe=0, data=149, model=0): 149, ProcessCoord(pipe=0, data=150, model=0): 150, ProcessCoord(pipe=0, data=151, model=0): 151, ProcessCoord(pipe=0, data=152, model=0): 152, ProcessCoord(pipe=0, data=153, model=0): 153, ProcessCoord(pipe=0, data=154, model=0): 154, ProcessCoord(pipe=0, data=155, model=0): 155, ProcessCoord(pipe=0, data=156, model=0): 156, ProcessCoord(pipe=0, data=157, model=0): 157, ProcessCoord(pipe=0, data=158, model=0): 158, ProcessCoord(pipe=0, data=159, model=0): 159, ProcessCoor + 0: d(pipe=0, data=160, model=0): 160, ProcessCoord(pipe=0, data=161, model=0): 161, ProcessCoord(pipe=0, data=162, model=0): 162, ProcessCoord(pipe=0, data=163, model=0): 163, ProcessCoord(pipe=0, data=164, model=0): 164, ProcessCoord(pipe=0, data=165, model=0): 165, ProcessCoord(pipe=0, data=166, model=0): 166, ProcessCoord(pipe=0, data=167, model=0): 167, ProcessCoord(pipe=0, data=168, model=0): 168, ProcessCoord(pipe=0, data=169, model=0): 169, ProcessCoord(pipe=0, data=170, model=0): 170, ProcessCoord(pipe=0, data=171, model=0): 171, ProcessCoord(pipe=0, data=172, model=0): 172, ProcessCoord(pipe=0, data=173, model=0): 173, ProcessCoord(pipe=0, data=174, model=0): 174, ProcessCoord(pipe=0, data=175, model=0): 175, ProcessCoord(pipe=0, data=176, model=0): 176, ProcessCoord(pipe=0, data=177, model=0): 177, ProcessCoord(pipe=0, data=178, model=0): 178, ProcessCoord(pipe=0, data=179, model=0): 179, ProcessCoord(pipe=0, data=180, model=0): 180, ProcessCoord(pipe=0, data=181, model=0): 181, ProcessCoord(pipe=0, da + 0: ta=182, model=0): 182, ProcessCoord(pipe=0, data=183, model=0): 183, ProcessCoord(pipe=0, data=184, model=0): 184, ProcessCoord(pipe=0, data=185, model=0): 185, ProcessCoord(pipe=0, data=186, model=0): 186, ProcessCoord(pipe=0, data=187, model=0): 187, ProcessCoord(pipe=0, data=188, model=0): 188, ProcessCoord(pipe=0, data=189, model=0): 189, ProcessCoord(pipe=0, data=190, model=0): 190, ProcessCoord(pipe=0, data=191, model=0): 191, ProcessCoord(pipe=0, data=192, model=0): 192, ProcessCoord(pipe=0, data=193, model=0): 193, ProcessCoord(pipe=0, data=194, model=0): 194, ProcessCoord(pipe=0, data=195, model=0): 195, ProcessCoord(pipe=0, data=196, model=0): 196, ProcessCoord(pipe=0, data=197, model=0): 197, ProcessCoord(pipe=0, data=198, model=0): 198, ProcessCoord(pipe=0, data=199, model=0): 199, ProcessCoord(pipe=0, data=200, model=0): 200, ProcessCoord(pipe=0, data=201, model=0): 201, ProcessCoord(pipe=0, data=202, model=0): 202, ProcessCoord(pipe=0, data=203, model=0): 203, ProcessCoord(pipe=0, data=204, mode + 0: l=0): 204, ProcessCoord(pipe=0, data=205, model=0): 205, ProcessCoord(pipe=0, data=206, model=0): 206, ProcessCoord(pipe=0, data=207, model=0): 207, ProcessCoord(pipe=0, data=208, model=0): 208, ProcessCoord(pipe=0, data=209, model=0): 209, ProcessCoord(pipe=0, data=210, model=0): 210, ProcessCoord(pipe=0, data=211, model=0): 211, ProcessCoord(pipe=0, data=212, model=0): 212, ProcessCoord(pipe=0, data=213, model=0): 213, ProcessCoord(pipe=0, data=214, model=0): 214, ProcessCoord(pipe=0, data=215, model=0): 215, ProcessCoord(pipe=0, data=216, model=0): 216, ProcessCoord(pipe=0, data=217, model=0): 217, ProcessCoord(pipe=0, data=218, model=0): 218, ProcessCoord(pipe=0, data=219, model=0): 219, ProcessCoord(pipe=0, data=220, model=0): 220, ProcessCoord(pipe=0, data=221, model=0): 221, ProcessCoord(pipe=0, data=222, model=0): 222, ProcessCoord(pipe=0, data=223, model=0): 223, ProcessCoord(pipe=0, data=224, model=0): 224, ProcessCoord(pipe=0, data=225, model=0): 225, ProcessCoord(pipe=0, data=226, model=0): 226, P + 0: rocessCoord(pipe=0, data=227, model=0): 227, ProcessCoord(pipe=0, data=228, model=0): 228, ProcessCoord(pipe=0, data=229, model=0): 229, ProcessCoord(pipe=0, data=230, model=0): 230, ProcessCoord(pipe=0, data=231, model=0): 231, ProcessCoord(pipe=0, data=232, model=0): 232, ProcessCoord(pipe=0, data=233, model=0): 233, ProcessCoord(pipe=0, data=234, model=0): 234, ProcessCoord(pipe=0, data=235, model=0): 235, ProcessCoord(pipe=0, data=236, model=0): 236, ProcessCoord(pipe=0, data=237, model=0): 237, ProcessCoord(pipe=0, data=238, model=0): 238, ProcessCoord(pipe=0, data=239, model=0): 239, ProcessCoord(pipe=0, data=240, model=0): 240, ProcessCoord(pipe=0, data=241, model=0): 241, ProcessCoord(pipe=0, data=242, model=0): 242, ProcessCoord(pipe=0, data=243, model=0): 243, ProcessCoord(pipe=0, data=244, model=0): 244, ProcessCoord(pipe=0, data=245, model=0): 245, ProcessCoord(pipe=0, data=246, model=0): 246, ProcessCoord(pipe=0, data=247, model=0): 247, ProcessCoord(pipe=0, data=248, model=0): 248, ProcessCoord( + 0: pipe=0, data=249, model=0): 249, ProcessCoord(pipe=0, data=250, model=0): 250, ProcessCoord(pipe=0, data=251, model=0): 251, ProcessCoord(pipe=0, data=252, model=0): 252, ProcessCoord(pipe=0, data=253, model=0): 253, ProcessCoord(pipe=0, data=254, model=0): 254, ProcessCoord(pipe=0, data=255, model=0): 255} + 0: [2023-05-13 00:59:36,451] [INFO] [module.py:366:_partition_layers] Partitioning pipeline stages with method type:transformer + 0: stage=0 layers=35 + 0: 0: _to_float16 + 0: 1: EmbeddingPipe + 0: 2: + 0: 3: ParallelTransformerLayerPipe + 0: 4: ParallelTransformerLayerPipe + 0: 5: ParallelTransformerLayerPipe + 0: 6: ParallelTransformerLayerPipe + 0: 7: ParallelTransformerLayerPipe + 0: 8: ParallelTransformerLayerPipe + 0: 9: ParallelTransformerLayerPipe + 0: 10: ParallelTransformerLayerPipe + 0: 11: ParallelTransformerLayerPipe + 0: 12: ParallelTransformerLayerPipe + 0: 13: ParallelTransformerLayerPipe + 0: 14: ParallelTransformerLayerPipe + 0: 15: ParallelTransformerLayerPipe + 0: 16: ParallelTransformerLayerPipe + 0: 17: ParallelTransformerLayerPipe + 0: 18: ParallelTransformerLayerPipe + 0: 19: ParallelTransformerLayerPipe + 0: 20: ParallelTransformerLayerPipe + 0: 21: ParallelTransformerLayerPipe + 0: 22: ParallelTransformerLayerPipe + 0: 23: ParallelTransformerLayerPipe + 0: 24: ParallelTransformerLayerPipe + 0: 25: ParallelTransformerLayerPipe + 0: 26: ParallelTransformerLayerPipe + 0: 27: ParallelTransformerLayerPipe + 0: 28: ParallelTransformerLayerPipe + 0: 29: ParallelTransformerLayerPipe + 0: 30: ParallelTransformerLayerPipe + 0: 31: undo + 0: 32: MixedFusedLayerNorm + 0: 33: EmbeddingPipe + 0: 34: float16_to_fp32 + 0: loss: CrossEntropy + 0: [2023-05-13 00:59:36,873] [INFO] [utils.py:827:see_memory_usage] After Building Model + 0: [2023-05-13 00:59:36,874] [INFO] [utils.py:828:see_memory_usage] MA 3.56 GB Max_MA 3.56 GB CA 3.74 GB Max_CA 4 GB + 0: [2023-05-13 00:59:36,874] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 37.3 GB, percent = 7.4% + 0: setting training iterations to 0 + 0: > learning rate decay style: cosine + 0: DeepSpeed is enabled. + 0: [2023-05-13 00:59:36,876] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed info: version=0.7.5, git-hash=unknown, git-branch=unknown + 0: [2023-05-13 01:00:00,951] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Flops Profiler Enabled: False + 0: [2023-05-13 01:00:00,951] [INFO] [logging.py:68:log_dist] [Rank 0] Removing param_group that has no 'params' in the client Optimizer + 0: [2023-05-13 01:00:00,952] [INFO] [logging.py:68:log_dist] [Rank 0] Using client Optimizer as basic optimizer + 0: [2023-05-13 01:00:00,965] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Basic Optimizer = FusedAdam + 0: [2023-05-13 01:00:00,965] [INFO] [logging.py:68:log_dist] [Rank 0] Creating BF16 optimizer + 0: [2023-05-13 01:00:01,088] [INFO] [utils.py:827:see_memory_usage] begin bf16_optimizer + 0: [2023-05-13 01:00:01,089] [INFO] [utils.py:828:see_memory_usage] MA 3.55 GB Max_MA 3.57 GB CA 3.76 GB Max_CA 4 GB + 0: [2023-05-13 01:00:01,089] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.04 GB, percent = 7.6% + 0: ninja: no work to do. +23: Time to load utils op: 0.45098280906677246 secondsTime to load utils op: 0.45005035400390625 seconds +23: +23: Time to load utils op: 0.4507451057434082 seconds +23: Time to load utils op: 0.45041418075561523 seconds +23: Time to load utils op: 0.4504404067993164 secondsTime to load utils op: 0.45050573348999023 seconds +23: +23: Time to load utils op: 0.45047426223754883 seconds +23: Time to load utils op: 0.4505486488342285 seconds + 6: Time to load utils op: 0.4746849536895752 seconds + 6: Time to load utils op: 0.4741380214691162 seconds + 6: Time to load utils op: 0.4750986099243164 seconds + 6: Time to load utils op: 0.47348880767822266 seconds + 0: Time to load utils op: 0.4815225601196289 seconds + 0: Time to load utils op: 0.48127079010009766 seconds + 0: Time to load utils op: 0.48138999938964844 seconds + 6: Time to load utils op: 0.47403812408447266 seconds + 6: Time to load utils op: 0.47440409660339355 seconds +29: Time to load utils op: 0.4394822120666504 secondsTime to load utils op: 0.4394805431365967 seconds +29: +29: Time to load utils op: 0.43949270248413086 seconds +25: Time to load utils op: 0.4400007724761963 secondsTime to load utils op: 0.4400146007537842 seconds +25: +25: Time to load utils op: 0.4400289058685303 seconds + 0: Time to load utils op: 0.48133373260498047 seconds + 6: Time to load utils op: 0.4751608371734619 seconds + 6: Time to load utils op: 0.47562646865844727 seconds + 2: Time to load utils op: 0.47467732429504395 seconds + 2: Time to load utils op: 0.47469115257263184 seconds + 2: Time to load utils op: 0.47469282150268555 seconds + 1: Time to load utils op: 0.4748072624206543 secondsTime to load utils op: 0.4748094081878662 seconds + 1: + 1: Time to load utils op: 0.47493743896484375 secondsTime to load utils op: 0.4749312400817871 seconds + 1: + 1: Time to load utils op: 0.474959135055542 seconds + 0: Time to load utils op: 0.48116326332092285 seconds + 0: Time to load utils op: 0.4814307689666748 seconds + 0: Time to load utils op: 0.4822371006011963 seconds +11: Time to load utils op: 0.4674060344696045 secondsTime to load utils op: 0.4667544364929199 seconds +11: +11: Time to load utils op: 0.46720266342163086 seconds +11: Time to load utils op: 0.4667673110961914 seconds + 0: Time to load utils op: 0.48213911056518555 seconds + 7: Time to load utils op: 0.46634531021118164 secondsTime to load utils op: 0.46613264083862305 seconds + 7: +29: Time to load utils op: 0.4399240016937256 seconds +30: Time to load utils op: 0.44367265701293945 seconds +30: Time to load utils op: 0.44489264488220215 seconds +30: Time to load utils op: 0.4441239833831787 seconds +30: Time to load utils op: 0.44423484802246094 seconds +29: Time to load utils op: 0.4399986267089844 seconds +29: Time to load utils op: 0.4400036334991455 secondsTime to load utils op: 0.44001245498657227 seconds +29: +29: Time to load utils op: 0.44002723693847656 seconds +25: Time to load utils op: 0.4404489994049072 secondsTime to load utils op: 0.44043993949890137 seconds +25: +25: Time to load utils op: 0.44045519828796387 seconds +25: Time to load utils op: 0.4404630661010742 seconds +25: Time to load utils op: 0.44046735763549805 seconds + 4: Time to load utils op: 0.4716756343841553 secondsTime to load utils op: 0.4716804027557373 seconds + 4: + 4: Time to load utils op: 0.47171854972839355 seconds + 1: Time to load utils op: 0.4752681255340576 secondsTime to load utils op: 0.4752814769744873 seconds + 1: + 1: Time to load utils op: 0.4752845764160156 seconds +24: Time to load utils op: 0.4404025077819824 seconds +14: Time to load utils op: 0.4559919834136963 secondsTime to load utils op: 0.4559953212738037 seconds +14: +14: Time to load utils op: 0.4560229778289795 seconds +14: Time to load utils op: 0.4560515880584717 seconds + 2: Time to load utils op: 0.47516727447509766 seconds +13: Time to load utils op: 0.4431307315826416 secondsTime to load utils op: 0.44314122200012207 seconds +13: +13: Time to load utils op: 0.44295287132263184 seconds + 2: Time to load utils op: 0.4751873016357422 seconds +11: Time to load utils op: 0.46721696853637695 secondsTime to load utils op: 0.4679899215698242 secondsTime to load utils op: 0.4673147201538086 seconds +11: +11: +11: Time to load utils op: 0.468156099319458 seconds +24: Time to load utils op: 0.44041943550109863 secondsTime to load utils op: 0.4404335021972656 seconds +24: +24: Time to load utils op: 0.44042468070983887 seconds +19: Time to load utils op: 0.4427976608276367 seconds +27: Time to load utils op: 0.4395313262939453 secondsTime to load utils op: 0.43952155113220215 seconds +27: + 3: Time to load utils op: 0.47267985343933105 secondsTime to load utils op: 0.4726886749267578 seconds + 3: Time to load utils op: 0.47269725799560547 seconds + 3: + 2: Time to load utils op: 0.4751930236816406 secondsTime to load utils op: 0.4752037525177002 seconds + 2: +30: Time to load utils op: 0.44500136375427246 seconds +12: Time to load utils op: 0.46605539321899414 seconds + 2: Time to load utils op: 0.4752082824707031 seconds +15: Time to load utils op: 0.4539647102355957 seconds +15: Time to load utils op: 0.4539816379547119 seconds +15: Time to load utils op: 0.453995943069458 seconds +15: Time to load utils op: 0.4540259838104248 seconds +30: Time to load utils op: 0.44464564323425293 seconds + 7: Time to load utils op: 0.46616268157958984 seconds +30: Time to load utils op: 0.44536638259887695 seconds +17: Time to load utils op: 0.4434645175933838 seconds +17: Time to load utils op: 0.44347620010375977 seconds +17: Time to load utils op: 0.44349002838134766 seconds + 7: Time to load utils op: 0.4662954807281494 seconds +21: Time to load utils op: 0.4556155204772949 secondsTime to load utils op: 0.4555234909057617 seconds +21: +21: Time to load utils op: 0.45613598823547363 secondsTime to load utils op: 0.45528149604797363 seconds +21: +26: Time to load utils op: 0.44008946418762207 seconds +26: Time to load utils op: 0.4401078224182129 seconds +26: Time to load utils op: 0.44012951850891113 seconds +26: Time to load utils op: 0.44012975692749023 seconds +30: Time to load utils op: 0.4450998306274414 seconds +16: Time to load utils op: 0.4624361991882324 secondsTime to load utils op: 0.46227478981018066 seconds +16: +16: Time to load utils op: 0.4622626304626465 seconds + 4: Time to load utils op: 0.47215986251831055 seconds + 4: Time to load utils op: 0.4721651077270508 seconds + 4: Time to load utils op: 0.4721856117248535 seconds + 4: Time to load utils op: 0.4721798896789551 seconds + 4: Time to load utils op: 0.47219085693359375 seconds + 7: Time to load utils op: 0.46653199195861816 seconds +13: Time to load utils op: 0.4438176155090332 secondsTime to load utils op: 0.443814754486084 secondsTime to load utils op: 0.44379401206970215 secondsTime to load utils op: 0.44382143020629883 seconds +13: +13: +13: +13: Time to load utils op: 0.4438052177429199 seconds +14: Time to load utils op: 0.4566221237182617 secondsTime to load utils op: 0.4566197395324707 secondsTime to load utils op: 0.4566335678100586 seconds +14: +14: +14: Time to load utils op: 0.4566459655761719 seconds +10: Time to load utils op: 0.46469640731811523 secondsTime to load utils op: 0.46471309661865234 seconds +10: + 3: Time to load utils op: 0.4732086658477783 secondsTime to load utils op: 0.47322511672973633 secondsTime to load utils op: 0.4732167720794678 secondsTime to load utils op: 0.4732377529144287 seconds + 3: + 3: Time to load utils op: 0.4732372760772705 seconds + 3: + 3: +12: Time to load utils op: 0.46639418601989746 secondsTime to load utils op: 0.46634602546691895 seconds +10: Time to load utils op: 0.46475863456726074 seconds +18: Time to load utils op: 0.45029187202453613 secondsTime to load utils op: 0.45029711723327637 seconds +18: +18: Time to load utils op: 0.45032572746276855 seconds +18: Time to load utils op: 0.45035338401794434 seconds +15: Time to load utils op: 0.4546222686767578 seconds +15: Time to load utils op: 0.4546318054199219 seconds +15: Time to load utils op: 0.45464468002319336 seconds +28: Time to load utils op: 0.44043993949890137 secondsTime to load utils op: 0.4404482841491699 seconds +28: Time to load utils op: 0.440476655960083 seconds +28: +28: Time to load utils op: 0.440462589263916 seconds +12: +17: Time to load utils op: 0.4442174434661865 seconds +17: Time to load utils op: 0.44423675537109375 seconds +10: Time to load utils op: 0.4647653102874756 seconds +10: Time to load utils op: 0.4647798538208008 secondsTime to load utils op: 0.4647810459136963 seconds +10: +21: Time to load utils op: 0.4565696716308594 seconds + 8: Time to load utils op: 0.46715331077575684 secondsTime to load utils op: 0.46715593338012695 seconds + 8: + 8: Time to load utils op: 0.46717047691345215 seconds + 8: Time to load utils op: 0.46718382835388184 seconds +10: Time to load utils op: 0.4647865295410156 secondsTime to load utils op: 0.4647970199584961 seconds +10: +15: Time to load utils op: 0.4546535015106201 seconds +26: Time to load utils op: 0.44061732292175293 seconds +26: Time to load utils op: 0.44063687324523926 secondsTime to load utils op: 0.4406468868255615 seconds +26: + 9: Time to load utils op: 0.46733951568603516 seconds + 9: Time to load utils op: 0.46733522415161133 seconds + 9: Time to load utils op: 0.4673473834991455 seconds + 7: Time to load utils op: 0.46686577796936035 secondsTime to load utils op: 0.4668710231781006 secondsTime to load utils op: 0.46685338020324707 seconds + 7: + 7: +21: Time to load utils op: 0.455533504486084 seconds +19: Time to load utils op: 0.4428086280822754 seconds +16: Time to load utils op: 0.46216392517089844 seconds +16: Time to load utils op: 0.462571382522583 secondsTime to load utils op: 0.462860107421875 seconds +16: Time to load utils op: 0.4623901844024658 seconds +16: +16: Time to load utils op: 0.4619019031524658 seconds +17: Time to load utils op: 0.44420719146728516 seconds +17: Time to load utils op: 0.44426488876342773 seconds +17: Time to load utils op: 0.4442741870880127 seconds +21: Time to load utils op: 0.4561178684234619 seconds +26: Time to load utils op: 0.44066905975341797 seconds +19: Time to load utils op: 0.4428393840789795 secondsTime to load utils op: 0.4428236484527588 seconds +19: +21: Time to load utils op: 0.4563610553741455 seconds +31: Time to load utils op: 0.4385406970977783 seconds +31: Time to load utils op: 0.4384794235229492 seconds + 9: Time to load utils op: 0.46739912033081055 seconds + 9: Time to load utils op: 0.4674105644226074 secondsTime to load utils op: 0.46741414070129395 seconds + 9: + 9: Time to load utils op: 0.46741390228271484 seconds + 9: Time to load utils op: 0.46742701530456543 seconds +27: Time to load utils op: 0.4395577907562256 seconds +20: Time to load utils op: 0.44292354583740234 seconds +20: Time to load utils op: 0.4429914951324463 seconds +20: Time to load utils op: 0.44301557540893555 seconds +12: Time to load utils op: 0.4664294719696045 seconds +18: Time to load utils op: 0.45110177993774414 secondsTime to load utils op: 0.45111966133117676 seconds +18: +31: Time to load utils op: 0.4386143684387207 seconds +19: Time to load utils op: 0.44336724281311035 secondsTime to load utils op: 0.4433720111846924 seconds +19: +28: Time to load utils op: 0.4419059753417969 secondsTime to load utils op: 0.44206929206848145 seconds +28: + 5: Time to load utils op: 0.4716770648956299 secondsTime to load utils op: 0.47168660163879395 seconds + 5: + 5: Time to load utils op: 0.47170138359069824 seconds + 5: Time to load utils op: 0.4717142581939697 seconds +31: Time to load utils op: 0.43863487243652344 seconds +12: Time to load utils op: 0.4665842056274414 seconds + 8: Time to load utils op: 0.46772217750549316 secondsTime to load utils op: 0.4677262306213379 seconds + 8: +18: Time to load utils op: 0.4511291980743408 seconds +18: Time to load utils op: 0.4511392116546631 seconds +31: Time to load utils op: 0.4386465549468994 secondsTime to load utils op: 0.4386568069458008 seconds +31: Time to load utils op: 0.4386630058288574 secondsTime to load utils op: 0.4386618137359619 seconds +31: +31: +19: Time to load utils op: 0.4433786869049072 seconds +12: Time to load utils op: 0.466625452041626 seconds +12: Time to load utils op: 0.46677494049072266 seconds +24: Time to load utils op: 0.4411177635192871 seconds +19: Time to load utils op: 0.44339728355407715 seconds +28: Time to load utils op: 0.44090723991394043 seconds +28: Time to load utils op: 0.4410436153411865 seconds +12: Time to load utils op: 0.4666152000427246 seconds + 8: Time to load utils op: 0.46775150299072266 seconds + 5: Time to load utils op: 0.4717411994934082 seconds + 5: Time to load utils op: 0.47174620628356934 secondsTime to load utils op: 0.47174572944641113 seconds + 5: +27: Time to load utils op: 0.44016003608703613 seconds +27: Time to load utils op: 0.44019103050231934 seconds +20: Time to load utils op: 0.4435746669769287 secondsTime to load utils op: 0.44358229637145996 seconds +20: + 8: Time to load utils op: 0.46776866912841797 seconds + 5: Time to load utils op: 0.47176146507263184 seconds +22: Time to load utils op: 0.4434621334075928 secondsTime to load utils op: 0.443758487701416 seconds +22: +22: Time to load utils op: 0.4439258575439453 secondsTime to load utils op: 0.4439074993133545 seconds +22: +24: Time to load utils op: 0.44113850593566895 seconds +24: Time to load utils op: 0.4411506652832031 seconds +24: Time to load utils op: 0.44115710258483887 seconds +27: Time to load utils op: 0.4401984214782715 seconds +27: Time to load utils op: 0.4402499198913574 seconds +20: Time to load utils op: 0.44364023208618164 seconds +27: Time to load utils op: 0.44026708602905273 seconds +20: Time to load utils op: 0.44365501403808594 seconds +20: Time to load utils op: 0.44366931915283203 seconds +22: Time to load utils op: 0.4447455406188965 secondsTime to load utils op: 0.44475579261779785 secondsTime to load utils op: 0.4447615146636963 seconds +22: +22: +22: Time to load utils op: 0.4447927474975586 seconds + 0: [2023-05-13 01:00:01,685] [INFO] [utils.py:827:see_memory_usage] before initializing group 0 + 0: [2023-05-13 01:00:01,685] [INFO] [utils.py:828:see_memory_usage] MA 3.55 GB Max_MA 3.55 GB CA 3.76 GB Max_CA 4 GB + 0: [2023-05-13 01:00:01,685] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.06 GB, percent = 7.6% +21: Time to load utils op: 0.0005781650543212891 seconds +21: Time to load utils op: 0.0005819797515869141 seconds +21: Time to load utils op: 0.0005564689636230469 seconds +21: Time to load utils op: 0.0005736351013183594 seconds +21: Time to load utils op: 0.0006535053253173828 seconds +21: Time to load utils op: 0.0006430149078369141 seconds +21: Time to load utils op: 0.00069427490234375 seconds +21: Time to load utils op: 0.0007390975952148438 seconds + 0: Time to load utils op: 0.0011103153228759766 seconds + 0: Time to load utils op: 0.0012519359588623047 secondsTime to load utils op: 0.0011763572692871094 seconds + 0: + 0: Time to load utils op: 0.0012297630310058594 seconds + 0: Time to load utils op: 0.0014526844024658203 secondsTime to load utils op: 0.0014088153839111328 seconds + 0: + 0: Time to load utils op: 0.0014662742614746094 seconds +12: Time to load utils op: 0.0011928081512451172 seconds +12: Time to load utils op: 0.0015063285827636719 seconds +12: Time to load utils op: 0.0015554428100585938 seconds +12: Time to load utils op: 0.001832723617553711 seconds +12: Time to load utils op: 0.0019791126251220703 seconds +12: Time to load utils op: 0.0014750957489013672 seconds +12: Time to load utils op: 0.0015676021575927734 seconds +12: Time to load utils op: 0.0015385150909423828 seconds +16: Time to load utils op: 0.0006172657012939453 seconds +16: Time to load utils op: 0.0007355213165283203 secondsTime to load utils op: 0.0007405281066894531 secondsTime to load utils op: 0.0007052421569824219 seconds +16: +16: Time to load utils op: 0.0007107257843017578 seconds +16: +16: Time to load utils op: 0.0007295608520507812 seconds +16: Time to load utils op: 0.0007305145263671875 seconds +16: Time to load utils op: 0.0006892681121826172 seconds +30: Time to load utils op: 0.0005459785461425781 seconds +30: Time to load utils op: 0.000408172607421875 seconds +30: Time to load utils op: 0.00039005279541015625 seconds +30: Time to load utils op: 0.00038743019104003906 seconds +30: Time to load utils op: 0.0009255409240722656 seconds +30: Time to load utils op: 0.0009016990661621094 seconds +30: Time to load utils op: 0.0008955001831054688 seconds +30: Time to load utils op: 0.0009217262268066406 seconds + 0: [2023-05-13 01:00:01,900] [INFO] [utils.py:827:see_memory_usage] after initializing group 0 + 0: [2023-05-13 01:00:01,901] [INFO] [utils.py:828:see_memory_usage] MA 7.26 GB Max_MA 7.26 GB CA 9.3 GB Max_CA 9 GB + 0: [2023-05-13 01:00:01,901] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.19 GB, percent = 7.6% +25: Time to load utils op: 0.0005733966827392578 seconds +25: Time to load utils op: 0.0003426074981689453 seconds +25: Time to load utils op: 0.0006930828094482422 seconds + 8: Time to load utils op: 0.0008602142333984375 seconds +25: Time to load utils op: 0.00046634674072265625 secondsTime to load utils op: 0.00043582916259765625 secondsTime to load utils op: 0.0004878044128417969 secondsTime to load utils op: 0.0004477500915527344 secondsTime to load utils op: 0.00044798851013183594 seconds +25: +25: +25: +25: + 1: Time to load utils op: 0.00119781494140625 seconds +10: Time to load utils op: 0.0008745193481445312 seconds +14: Time to load utils op: 0.000736236572265625 seconds +11: Time to load utils op: 0.0007121562957763672 seconds +13: Time to load utils op: 0.0009069442749023438 seconds +13: Time to load utils op: 0.0009171962738037109 seconds + 1: Time to load utils op: 0.001409292221069336 secondsTime to load utils op: 0.001207590103149414 seconds + 1: + 1: Time to load utils op: 0.0013666152954101562 secondsTime to load utils op: 0.0014290809631347656 seconds + 8: Time to load utils op: 0.0010786056518554688 seconds + 1: +11: Time to load utils op: 0.0008573532104492188 seconds +10: Time to load utils op: 0.0008883476257324219 secondsTime to load utils op: 0.0008859634399414062 seconds +10: +14: Time to load utils op: 0.0007240772247314453 seconds + 1: Time to load utils op: 0.0014383792877197266 secondsTime to load utils op: 0.0014030933380126953 seconds + 1: +11: Time to load utils op: 0.0008604526519775391 seconds +13: Time to load utils op: 0.0009291172027587891 secondsTime to load utils op: 0.0009751319885253906 secondsTime to load utils op: 0.0009164810180664062 seconds +13: +13: +13: Time to load utils op: 0.0009179115295410156 seconds +13: Time to load utils op: 0.0008993148803710938 seconds +14: Time to load utils op: 0.0007448196411132812 seconds +10: Time to load utils op: 0.0008497238159179688 secondsTime to load utils op: 0.0008640289306640625 seconds +10: +14: Time to load utils op: 0.0006952285766601562 seconds +15: Time to load utils op: 0.0012924671173095703 seconds +10: Time to load utils op: 0.0008866786956787109 seconds +10: Time to load utils op: 0.000858306884765625 seconds +10: Time to load utils op: 0.0009276866912841797 seconds + 8: Time to load utils op: 0.0012743473052978516 secondsTime to load utils op: 0.0009768009185791016 seconds + 8: + 8: Time to load utils op: 0.0009758472442626953 seconds + 8: Time to load utils op: 0.0010144710540771484 seconds + 8: Time to load utils op: 0.0010080337524414062 seconds +29: Time to load utils op: 0.0007991790771484375 seconds +29: Time to load utils op: 0.0007364749908447266 seconds +29: Time to load utils op: 0.0007634162902832031 seconds +29: Time to load utils op: 0.0007748603820800781 seconds +29: Time to load utils op: 0.0008296966552734375 seconds +27: Time to load utils op: 0.0011174678802490234 seconds +13: Time to load utils op: 0.0016584396362304688 seconds +26: Time to load utils op: 0.0009465217590332031 seconds +29: Time to load utils op: 0.0011088848114013672 seconds +14: Time to load utils op: 0.001447439193725586 seconds +27: Time to load utils op: 0.0011188983917236328 secondsTime to load utils op: 0.0010895729064941406 seconds +27: + 1: Time to load utils op: 0.0020558834075927734 seconds +11: Time to load utils op: 0.0014607906341552734 seconds + 8: Time to load utils op: 0.0016074180603027344 seconds +27: Time to load utils op: 0.0012242794036865234 seconds +17: Time to load utils op: 0.0013473033905029297 seconds +26: Time to load utils op: 0.0011332035064697266 seconds +27: Time to load utils op: 0.001190185546875 secondsTime to load utils op: 0.0011925697326660156 seconds +27: +11: Time to load utils op: 0.0016736984252929688 seconds + 3: Time to load utils op: 0.0015399456024169922 seconds +22: Time to load utils op: 0.001377105712890625 seconds +29: Time to load utils op: 0.0010862350463867188 seconds +27: Time to load utils op: 0.0013873577117919922 seconds +29: Time to load utils op: 0.0011320114135742188 seconds +26: Time to load utils op: 0.0012483596801757812 seconds +27: Time to load utils op: 0.0015406608581542969 seconds +26: Time to load utils op: 0.0012242794036865234 seconds + 3: Time to load utils op: 0.0016050338745117188 seconds + 2: Time to load utils op: 0.0021903514862060547 seconds +17: Time to load utils op: 0.0014553070068359375 secondsTime to load utils op: 0.0014584064483642578 seconds +17: +15: Time to load utils op: 0.0024619102478027344 seconds +26: Time to load utils op: 0.0013768672943115234 seconds +14: Time to load utils op: 0.0019795894622802734 seconds + 7: Time to load utils op: 0.0016090869903564453 seconds +26: Time to load utils op: 0.0014259815216064453 secondsTime to load utils op: 0.0014116764068603516 seconds +26: +24: Time to load utils op: 0.0026464462280273438 seconds +20: Time to load utils op: 0.0018181800842285156 seconds +17: Time to load utils op: 0.0015375614166259766 seconds +14: Time to load utils op: 0.0020499229431152344 seconds +18: Time to load utils op: 0.0024137496948242188 seconds +26: Time to load utils op: 0.0015740394592285156 seconds +28: Time to load utils op: 0.0018885135650634766 seconds +22: Time to load utils op: 0.0020592212677001953 seconds + 3: Time to load utils op: 0.0021085739135742188 seconds +23: Time to load utils op: 0.0021102428436279297 seconds +23: Time to load utils op: 0.002123594284057617 seconds +20: Time to load utils op: 0.0020580291748046875 seconds +17: Time to load utils op: 0.0019867420196533203 seconds +23: Time to load utils op: 0.002178192138671875 seconds +22: Time to load utils op: 0.0025107860565185547 seconds + 9: Time to load utils op: 0.002638101577758789 seconds + 5: Time to load utils op: 0.0024552345275878906 seconds + 5: Time to load utils op: 0.0024979114532470703 seconds +11: Time to load utils op: 0.002980947494506836 seconds + 5: Time to load utils op: 0.0024955272674560547 seconds +11: Time to load utils op: 0.003068208694458008 seconds + 6: Time to load utils op: 0.002853870391845703 seconds + 3: Time to load utils op: 0.0029153823852539062 seconds + 9: Time to load utils op: 0.0029103755950927734 seconds + 9: Time to load utils op: 0.003040313720703125 seconds + 9: Time to load utils op: 0.003001689910888672 seconds + 3: Time to load utils op: 0.003048419952392578 seconds + 4: Time to load utils op: 0.003312349319458008 seconds +11: Time to load utils op: 0.0034422874450683594 seconds +19: Time to load utils op: 0.0026934146881103516 seconds +14: Time to load utils op: 0.0032258033752441406 seconds +23: Time to load utils op: 0.0031020641326904297 seconds + 9: Time to load utils op: 0.003141164779663086 seconds +20: Time to load utils op: 0.0028192996978759766 seconds +17: Time to load utils op: 0.0026712417602539062 seconds +20: Time to load utils op: 0.002852916717529297 seconds +17: Time to load utils op: 0.003216266632080078 seconds + 6: Time to load utils op: 0.003016948699951172 seconds +20: Time to load utils op: 0.0029366016387939453 seconds +19: Time to load utils op: 0.002847909927368164 seconds +20: Time to load utils op: 0.0028181076049804688 seconds +19: Time to load utils op: 0.002862215042114258 seconds +19: Time to load utils op: 0.0029430389404296875 seconds +22: Time to load utils op: 0.003459930419921875 seconds + 2: Time to load utils op: 0.0040149688720703125 seconds +15: Time to load utils op: 0.0041351318359375 seconds +18: Time to load utils op: 0.003949880599975586 seconds +31: Time to load utils op: 0.0036563873291015625 seconds + 6: Time to load utils op: 0.003464937210083008 seconds +17: Time to load utils op: 0.0033431053161621094 seconds +23: Time to load utils op: 0.003531217575073242 seconds +15: Time to load utils op: 0.004258155822753906 seconds +28: Time to load utils op: 0.003413677215576172 seconds + 4: Time to load utils op: 0.0038559436798095703 seconds +23: Time to load utils op: 0.003572702407836914 seconds +31: Time to load utils op: 0.0038614273071289062 secondsTime to load utils op: 0.0038008689880371094 seconds +31: +15: Time to load utils op: 0.004246234893798828 seconds +15: Time to load utils op: 0.004233360290527344 seconds +24: Time to load utils op: 0.004462718963623047 seconds +23: Time to load utils op: 0.0036907196044921875 seconds +15: Time to load utils op: 0.004286050796508789 seconds +23: Time to load utils op: 0.003643035888671875 seconds +15: Time to load utils op: 0.004296302795410156 seconds +22: Time to load utils op: 0.0038573741912841797 seconds + 2: Time to load utils op: 0.00435328483581543 seconds + 7: Time to load utils op: 0.0036771297454833984 seconds +22: Time to load utils op: 0.003825664520263672 seconds + 9: Time to load utils op: 0.003932952880859375 secondsTime to load utils op: 0.0039327144622802734 seconds + 9: +22: Time to load utils op: 0.0037789344787597656 seconds +22: Time to load utils op: 0.0038595199584960938 seconds + 9: Time to load utils op: 0.003975868225097656 seconds +31: Time to load utils op: 0.004118919372558594 seconds +20: Time to load utils op: 0.0038750171661376953 seconds +19: Time to load utils op: 0.0037021636962890625 seconds +20: Time to load utils op: 0.0038657188415527344 seconds +31: Time to load utils op: 0.0039997100830078125 seconds + 2: Time to load utils op: 0.004591464996337891 seconds +31: Time to load utils op: 0.004179477691650391 seconds +19: Time to load utils op: 0.003702878952026367 seconds +19: Time to load utils op: 0.003709554672241211 seconds +31: Time to load utils op: 0.003936767578125 seconds +19: Time to load utils op: 0.003751993179321289 seconds +28: Time to load utils op: 0.003838777542114258 seconds +24: Time to load utils op: 0.005117893218994141 seconds + 3: Time to load utils op: 0.004161357879638672 secondsTime to load utils op: 0.0041081905364990234 seconds + 3: + 3: Time to load utils op: 0.004168510437011719 seconds +31: Time to load utils op: 0.004032611846923828 seconds +28: Time to load utils op: 0.003927946090698242 seconds + 2: Time to load utils op: 0.004647731781005859 seconds + 2: Time to load utils op: 0.004714012145996094 seconds + 2: Time to load utils op: 0.004723310470581055 seconds +28: Time to load utils op: 0.0038728713989257812 seconds + 5: Time to load utils op: 0.0039119720458984375 seconds +28: Time to load utils op: 0.004019737243652344 seconds +28: Time to load utils op: 0.0038678646087646484 seconds + 5: Time to load utils op: 0.004018068313598633 seconds +28: Time to load utils op: 0.0038900375366210938 seconds + 6: Time to load utils op: 0.004145145416259766 seconds + 6: Time to load utils op: 0.004166603088378906 seconds + 5: Time to load utils op: 0.003969907760620117 seconds + 5: Time to load utils op: 0.004009723663330078 seconds + 2: Time to load utils op: 0.00489044189453125 seconds +24: Time to load utils op: 0.005121707916259766 seconds + 6: Time to load utils op: 0.004232645034790039 secondsTime to load utils op: 0.004170417785644531 secondsTime to load utils op: 0.004174947738647461 seconds + 6: + 6: + 5: Time to load utils op: 0.004117250442504883 seconds +24: Time to load utils op: 0.005091428756713867 seconds + 4: Time to load utils op: 0.004560708999633789 secondsTime to load utils op: 0.004587411880493164 seconds + 4: + 4: Time to load utils op: 0.004710197448730469 seconds + 4: Time to load utils op: 0.004723548889160156 seconds + 7: Time to load utils op: 0.004357337951660156 seconds +24: Time to load utils op: 0.005127668380737305 seconds + 4: Time to load utils op: 0.00462651252746582 seconds + 4: Time to load utils op: 0.0046329498291015625 seconds +24: Time to load utils op: 0.005212306976318359 seconds + 7: Time to load utils op: 0.0042877197265625 seconds +18: Time to load utils op: 0.0046312808990478516 seconds +18: Time to load utils op: 0.00463557243347168 seconds + 7: Time to load utils op: 0.004361867904663086 seconds +18: Time to load utils op: 0.004641532897949219 seconds +24: Time to load utils op: 0.0053789615631103516 seconds + 7: Time to load utils op: 0.004300355911254883 secondsTime to load utils op: 0.004311800003051758 seconds + 7: + 7: Time to load utils op: 0.0042836666107177734 seconds +18: Time to load utils op: 0.0046770572662353516 seconds +18: Time to load utils op: 0.0050694942474365234 seconds +18: Time to load utils op: 0.005049228668212891 seconds + 0: [2023-05-13 01:00:02,010] [INFO] [utils.py:827:see_memory_usage] before initializing group 1 + 0: [2023-05-13 01:00:02,010] [INFO] [utils.py:828:see_memory_usage] MA 7.26 GB Max_MA 7.26 GB CA 9.3 GB Max_CA 9 GB + 0: [2023-05-13 01:00:02,010] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.24 GB, percent = 7.6% + 0: [2023-05-13 01:00:02,120] [INFO] [utils.py:827:see_memory_usage] after initializing group 1 + 0: [2023-05-13 01:00:02,120] [INFO] [utils.py:828:see_memory_usage] MA 10.67 GB Max_MA 10.67 GB CA 14.4 GB Max_CA 14 GB + 0: [2023-05-13 01:00:02,120] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.25 GB, percent = 7.6% + 0: [2023-05-13 01:00:02,225] [INFO] [utils.py:827:see_memory_usage] before initializing group 2 + 0: [2023-05-13 01:00:02,225] [INFO] [utils.py:828:see_memory_usage] MA 10.67 GB Max_MA 10.67 GB CA 14.4 GB Max_CA 14 GB + 0: [2023-05-13 01:00:02,225] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.25 GB, percent = 7.6% + 0: [2023-05-13 01:00:02,333] [INFO] [utils.py:827:see_memory_usage] after initializing group 2 + 0: [2023-05-13 01:00:02,334] [INFO] [utils.py:828:see_memory_usage] MA 10.68 GB Max_MA 10.68 GB CA 14.4 GB Max_CA 14 GB + 0: [2023-05-13 01:00:02,334] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.25 GB, percent = 7.6% + 0: [2023-05-13 01:00:02,438] [INFO] [utils.py:827:see_memory_usage] before initialize_optimizer + 0: [2023-05-13 01:00:02,439] [INFO] [utils.py:828:see_memory_usage] MA 10.68 GB Max_MA 10.68 GB CA 14.4 GB Max_CA 14 GB + 0: [2023-05-13 01:00:02,439] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.25 GB, percent = 7.6% + 0: [2023-05-13 01:00:02,549] [INFO] [utils.py:827:see_memory_usage] end initialize_optimizer + 0: [2023-05-13 01:00:02,550] [INFO] [utils.py:828:see_memory_usage] MA 10.73 GB Max_MA 10.73 GB CA 14.4 GB Max_CA 14 GB + 0: [2023-05-13 01:00:02,550] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.25 GB, percent = 7.6% + 0: [2023-05-13 01:00:02,655] [INFO] [utils.py:827:see_memory_usage] end bf16_optimizer + 0: [2023-05-13 01:00:02,656] [INFO] [utils.py:828:see_memory_usage] MA 10.73 GB Max_MA 10.73 GB CA 14.4 GB Max_CA 14 GB + 0: [2023-05-13 01:00:02,656] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.25 GB, percent = 7.6% + 0: [2023-05-13 01:00:02,656] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Final Optimizer = FusedAdam + 0: [2023-05-13 01:00:02,656] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed using client LR scheduler + 0: [2023-05-13 01:00:02,656] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed LR Scheduler = + 0: [2023-05-13 01:00:02,656] [INFO] [logging.py:68:log_dist] [Rank 0] step=0, skipped=0, lr=[0.0002, 0.0002, 0.0002], mom=[(0.9, 0.999), (0.9, 0.999), (0.9, 0.999)] + 0: [2023-05-13 01:00:02,657] [INFO] [config.py:1007:print] DeepSpeedEngine configuration: + 0: [2023-05-13 01:00:02,657] [INFO] [config.py:1011:print] activation_checkpointing_config { + 0: "partition_activations": false, + 0: "contiguous_memory_optimization": false, + 0: "cpu_checkpointing": false, + 0: "number_checkpoints": null, + 0: "synchronize_checkpoint_boundary": false, + 0: "profile": false + 0: } + 0: [2023-05-13 01:00:02,657] [INFO] [config.py:1011:print] aio_config ................... {'block_size': 1048576, 'queue_depth': 8, 'thread_count': 1, 'single_submit': False, 'overlap_events': True} + 0: [2023-05-13 01:00:02,657] [INFO] [config.py:1011:print] amp_enabled .................. False + 0: [2023-05-13 01:00:02,657] [INFO] [config.py:1011:print] amp_params ................... False + 0: [2023-05-13 01:00:02,657] [INFO] [config.py:1011:print] autotuning_config ............ { + 0: "enabled": false, + 0: "start_step": null, + 0: "end_step": null, + 0: "metric_path": null, + 0: "arg_mappings": null, + 0: "metric": "throughput", + 0: "model_info": null, + 0: "results_dir": "/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/autotuning_results", + 0: "exps_dir": "/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/autotuning_exps", + 0: "overwrite": true, + 0: "fast": true, + 0: "start_profile_step": 3, + 0: "end_profile_step": 5, + 0: "tuner_type": "gridsearch", + 0: "tuner_early_stopping": 5, + 0: "tuner_num_trials": 50, + 0: "model_info_path": null, + 0: "mp_size": 1, + 0: "max_train_batch_size": null, + 0: "min_train_batch_size": 1, + 0: "max_train_micro_batch_size_per_gpu": 1.024000e+03, + 0: "min_train_micro_batch_size_per_gpu": 1, + 0: "num_tuning_micro_batch_sizes": 3 + 0: } + 0: [2023-05-13 01:00:02,657] [INFO] [config.py:1011:print] bfloat16_enabled ............. True + 0: [2023-05-13 01:00:02,657] [INFO] [config.py:1011:print] checkpoint_parallel_write_pipeline False + 0: [2023-05-13 01:00:02,657] [INFO] [config.py:1011:print] checkpoint_tag_validation_enabled True + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] checkpoint_tag_validation_fail False + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] comms_config ................. + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] communication_data_type ...... None + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] compression_config ........... {'weight_quantization': {'shared_parameters': {'enabled': False, 'quantizer_kernel': False, 'schedule_offset': 0, 'quantize_groups': 1, 'quantize_verbose': False, 'quantization_type': 'symmetric', 'quantize_weight_in_forward': False, 'rounding': 'nearest', 'fp16_mixed_quantize': False, 'quantize_change_ratio': 0.001}, 'different_groups': {}}, 'activation_quantization': {'shared_parameters': {'enabled': False, 'quantization_type': 'symmetric', 'range_calibration': 'dynamic', 'schedule_offset': 1000}, 'different_groups': {}}, 'sparse_pruning': {'shared_parameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'row_pruning': {'shared_parameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'head_pruning': {'shared_parameters': {'enabled': False, 'method': 'topk', 'schedule_offset': 1000}, 'different_groups': {}}, 'channel_pruning': {'shared_pa + 0: rameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'layer_reduction': {'enabled': False}} + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] curriculum_enabled ........... False + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] curriculum_params ............ False + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] dataloader_drop_last ......... False + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] disable_allgather ............ False + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] dump_state ................... False + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] dynamic_loss_scale_args ...... None + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] eigenvalue_enabled ........... False + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] eigenvalue_gas_boundary_resolution 1 + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] eigenvalue_layer_name ........ bert.encoder.layer + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] eigenvalue_layer_num ......... 0 + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] eigenvalue_max_iter .......... 100 + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] eigenvalue_stability ......... 1e-06 + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] eigenvalue_tol ............... 0.01 + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] eigenvalue_verbose ........... False + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] elasticity_enabled ........... False + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] flops_profiler_config ........ { + 0: "enabled": false, + 0: "profile_step": 1, + 0: "module_depth": -1, + 0: "top_modules": 1, + 0: "detailed": true, + 0: "output_file": null + 0: } + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] fp16_auto_cast ............... None + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] fp16_enabled ................. False + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] fp16_master_weights_and_gradients False + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] global_rank .................. 0 + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] gradient_accumulation_steps .. 1 + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] gradient_clipping ............ 1.0 + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] gradient_predivide_factor .... 1.0 + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] initial_dynamic_scale ........ 1 + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] load_universal_checkpoint .... False + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] loss_scale ................... 1.0 + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] memory_breakdown ............. False + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] monitor_config ............... + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] nebula_config ................ { + 0: "enabled": false, + 0: "persistent_storage_path": null, + 0: "persistent_time_interval": 100, + 0: "num_of_version_in_retention": 2, + 0: "enable_nebula_load": true, + 0: "load_path": null + 0: } + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] optimizer_legacy_fusion ...... False + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] optimizer_name ............... None + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] optimizer_params ............. None + 0: [2023-05-13 01:00:02,658] [INFO] [config.py:1011:print] pipeline ..................... {'stages': 'auto', 'partition': 'best', 'seed_layers': False, 'activation_checkpoint_interval': 0} + 0: [2023-05-13 01:00:02,659] [INFO] [config.py:1011:print] pld_enabled .................. False + 0: [2023-05-13 01:00:02,659] [INFO] [config.py:1011:print] pld_params ................... False + 0: [2023-05-13 01:00:02,659] [INFO] [config.py:1011:print] prescale_gradients ........... False + 0: [2023-05-13 01:00:02,659] [INFO] [config.py:1011:print] scheduler_name ............... None + 0: [2023-05-13 01:00:02,659] [INFO] [config.py:1011:print] scheduler_params ............. None + 0: [2023-05-13 01:00:02,659] [INFO] [config.py:1011:print] sparse_attention ............. None + 0: [2023-05-13 01:00:02,659] [INFO] [config.py:1011:print] sparse_gradients_enabled ..... False + 0: [2023-05-13 01:00:02,659] [INFO] [config.py:1011:print] steps_per_print .............. 2000 + 0: [2023-05-13 01:00:02,659] [INFO] [config.py:1011:print] train_batch_size ............. 512 + 0: [2023-05-13 01:00:02,659] [INFO] [config.py:1011:print] train_micro_batch_size_per_gpu 2 + 0: [2023-05-13 01:00:02,659] [INFO] [config.py:1011:print] use_node_local_storage ....... False + 0: [2023-05-13 01:00:02,659] [INFO] [config.py:1011:print] wall_clock_breakdown ......... False + 0: [2023-05-13 01:00:02,659] [INFO] [config.py:1011:print] world_size ................... 256 + 0: [2023-05-13 01:00:02,659] [INFO] [config.py:1011:print] zero_allow_untested_optimizer False + 0: [2023-05-13 01:00:02,659] [INFO] [config.py:1011:print] zero_config .................. stage=0 contiguous_gradients=True reduce_scatter=True reduce_bucket_size=500000000 allgather_partitions=True allgather_bucket_size=500000000 overlap_comm=False load_from_fp32_weights=True elastic_checkpoint=False offload_param=None offload_optimizer=None sub_group_size=1000000000 cpu_offload_param=None cpu_offload_use_pin_memory=None cpu_offload=None prefetch_bucket_size=50000000 param_persistence_threshold=100000 model_persistence_threshold=9223372036854775807 max_live_parameters=1000000000 max_reuse_distance=1000000000 gather_16bit_weights_on_model_save=False stage3_gather_fp16_weights_on_model_save=False ignore_unused_parameters=True legacy_stage1=False round_robin_gradients=False + 0: [2023-05-13 01:00:02,659] [INFO] [config.py:1011:print] zero_enabled ................. False + 0: [2023-05-13 01:00:02,659] [INFO] [config.py:1011:print] zero_optimization_stage ...... 0 + 0: [2023-05-13 01:00:02,659] [INFO] [config.py:996:print_user_config] json = { + 0: "train_micro_batch_size_per_gpu": 2, + 0: "train_batch_size": 512, + 0: "gradient_clipping": 1.0, + 0: "zero_optimization": { + 0: "stage": 0 + 0: }, + 0: "bf16": { + 0: "enabled": true + 0: }, + 0: "steps_per_print": 2.000000e+03, + 0: "wall_clock_breakdown": false + 0: } + 0: Time to load utils op: 0.00042629241943359375 seconds + 0: [2023-05-13 01:00:02,660] [INFO] [engine.py:87:__init__] CONFIG: micro_batches=1 micro_batch_size=2 + 0: [2023-05-13 01:00:02,722] [INFO] [engine.py:145:__init__] RANK=0 STAGE=0 LAYERS=35 [0, 35) STAGE_PARAMS=1905090048 (1905.090M) TOTAL_PARAMS=1905090048 (1905.090M) UNIQUE_PARAMS=1905090048 (1905.090M) +24: [2023-05-13 01:00:02,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +24: [2023-05-13 01:00:02,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +24: [2023-05-13 01:00:02,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +24: [2023-05-13 01:00:02,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +24: [2023-05-13 01:00:02,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +24: [2023-05-13 01:00:02,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +24: [2023-05-13 01:00:02,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +24: [2023-05-13 01:00:02,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 0: [2023-05-13 01:00:02,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 0: [2023-05-13 01:00:02,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 0: [2023-05-13 01:00:02,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 0: [2023-05-13 01:00:02,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 0: [2023-05-13 01:00:02,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 0: [2023-05-13 01:00:02,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 0: [2023-05-13 01:00:02,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +25: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +21: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +25: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +25: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +25: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +25: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +25: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +21: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +21: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +15: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +15: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +31: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +25: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +21: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +31: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +31: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +31: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 4: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 4: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +21: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +21: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +21: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +15: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +15: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +15: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +15: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +31: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +25: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 4: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 4: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 4: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +15: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +31: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 4: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 4: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +23: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +22: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +22: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +22: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +22: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +22: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 0: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +15: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +22: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +22: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +29: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 4: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +21: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +23: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +23: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +23: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +23: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +23: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +23: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 8: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 8: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 8: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 8: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 8: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 8: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 8: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +29: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +29: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +29: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +29: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +31: [2023-05-13 01:00:02,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +22: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +29: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +29: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 2: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +18: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 5: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +18: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +18: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +18: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +18: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +18: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 2: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 2: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 2: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 2: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 2: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +18: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 2: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 5: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 7: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +29: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 5: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 5: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 7: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 7: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 7: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 7: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 7: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 5: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 5: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 5: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 7: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 5: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +23: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 7: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +10: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +31: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +19: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 8: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 9: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +12: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +26: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 9: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +27: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +18: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +12: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 2: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 3: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 3: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 3: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 3: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 3: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +12: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +12: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +26: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +12: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 3: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 3: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +12: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +26: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +26: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +26: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +12: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +10: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +10: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +10: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +10: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +10: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +19: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +19: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +19: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +19: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +19: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +10: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 3: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +26: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +26: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 9: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 9: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 9: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 9: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 9: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +17: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +17: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +17: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +17: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +17: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +19: [2023-05-13 01:00:02,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +14: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +14: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +14: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +14: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +14: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +12: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +17: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +17: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +14: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +27: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +27: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +27: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +27: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +27: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +14: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +27: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 9: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +19: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +14: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +17: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +11: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +11: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +11: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +11: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +10: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +11: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +11: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +11: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +26: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +27: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 1: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 1: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 1: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 1: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 1: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 1: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 1: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +16: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +16: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +30: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +30: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +30: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +30: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +30: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +30: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +30: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +16: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +16: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +16: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +16: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +11: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +13: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +13: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +16: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 1: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +30: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +16: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 6: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 6: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 6: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 6: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 6: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 6: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 6: [2023-05-13 01:00:02,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +13: [2023-05-13 01:00:02,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +13: [2023-05-13 01:00:02,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +13: [2023-05-13 01:00:02,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +13: [2023-05-13 01:00:02,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +13: [2023-05-13 01:00:02,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 6: [2023-05-13 01:00:02,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +13: [2023-05-13 01:00:02,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +28: [2023-05-13 01:00:02,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +28: [2023-05-13 01:00:02,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +28: [2023-05-13 01:00:02,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +28: [2023-05-13 01:00:02,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +28: [2023-05-13 01:00:02,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +28: [2023-05-13 01:00:02,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +28: [2023-05-13 01:00:02,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +28: [2023-05-13 01:00:02,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 0: [2023-05-13 01:00:02,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 0: [2023-05-13 01:00:02,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 0: [2023-05-13 01:00:02,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 0: [2023-05-13 01:00:02,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 0: [2023-05-13 01:00:02,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 0: [2023-05-13 01:00:02,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 0: [2023-05-13 01:00:02,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 0: [2023-05-13 01:00:02,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 0: [2023-05-13 01:00:02,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 0: [2023-05-13 01:00:02,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 0: [2023-05-13 01:00:02,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 0: [2023-05-13 01:00:02,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 0: [2023-05-13 01:00:02,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 0: [2023-05-13 01:00:02,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 0: [2023-05-13 01:00:02,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 0: [2023-05-13 01:00:02,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 0: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 0: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +21: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +21: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +21: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +21: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +21: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +21: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +21: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +21: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +21: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +21: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +21: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +21: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +21: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +21: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 0: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +21: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 0: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +21: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 0: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 0: [2023-05-13 01:00:02,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 0: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 0: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 0: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 0: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 0: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 0: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 0: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 0: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 0: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 0: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +21: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +20: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +20: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +20: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +20: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +20: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +20: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +20: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +20: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +21: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +22: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +22: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +22: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +22: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +22: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +22: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +31: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +31: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +31: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +31: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +31: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +22: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +22: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +22: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +21: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +22: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +31: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +22: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +31: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +31: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +22: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +22: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +22: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +22: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +31: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +31: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +31: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +31: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +31: [2023-05-13 01:00:02,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +21: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +22: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +31: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +31: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +21: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +31: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +21: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +21: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +21: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +21: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +21: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +21: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +12: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +12: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +12: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +12: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +12: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +12: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +12: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +21: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +12: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +12: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +12: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +21: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +12: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +12: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +12: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +12: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +21: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +21: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +12: [2023-05-13 01:00:02,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +21: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +12: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +22: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +31: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +31: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +20: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +22: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +22: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +31: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +20: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +26: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +26: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +26: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +20: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +26: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +26: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +26: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +26: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +22: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +22: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +31: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +26: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +26: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +26: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +26: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +26: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +26: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +26: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +22: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +18: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +31: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +26: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +22: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +20: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +18: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +18: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +18: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +18: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +18: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +18: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +18: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +20: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +18: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +18: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +18: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +22: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +31: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +20: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +18: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +18: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +18: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +26: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +22: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +20: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +12: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +10: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +10: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +10: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +10: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +18: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +22: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +22: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +31: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +10: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +10: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +10: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +31: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +20: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +18: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +31: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 7: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 7: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 7: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 7: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +10: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +10: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +10: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 7: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 7: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 7: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 7: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 7: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +10: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +22: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +12: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 7: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +10: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +10: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +10: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 7: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +10: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +22: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +31: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +31: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +31: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +20: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 7: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 7: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 7: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +22: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +12: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +10: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 7: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +31: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +22: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +12: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +25: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +20: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +31: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +20: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +22: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 7: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +25: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +25: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +25: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +25: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +25: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +12: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +25: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +25: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +20: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +31: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +16: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +16: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +16: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +16: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +16: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +25: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +25: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +25: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +25: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +25: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +31: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +25: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +12: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +12: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +16: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +16: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +25: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +23: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +23: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +23: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +23: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +23: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +12: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +12: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +25: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +23: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +23: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +12: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 4: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 4: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 4: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +16: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +16: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +16: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +16: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +16: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +23: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +23: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +23: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +23: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +23: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 4: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 4: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 4: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 4: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +23: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +23: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +14: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +14: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +14: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +14: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 4: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 4: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +16: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +16: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +23: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 4: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 4: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 4: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 4: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 4: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +12: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +12: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +14: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +14: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +14: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +19: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +19: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +19: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +19: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +19: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +14: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +14: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 4: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +23: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +19: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +14: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +14: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +30: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +30: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +30: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +30: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +30: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +19: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +30: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +30: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +19: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +19: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +16: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +14: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +14: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +14: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 4: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +19: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +19: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +19: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +12: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +19: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +18: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +14: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +12: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +30: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +30: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +30: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +30: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +12: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +30: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +16: [2023-05-13 01:00:02,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +14: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +12: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +27: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +27: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +27: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +27: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +27: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +27: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +19: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +27: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +26: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +26: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +27: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +27: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +27: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +19: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +27: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +27: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +18: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +27: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +27: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +10: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +30: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +30: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +27: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +10: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +18: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 7: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +26: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +27: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +18: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +10: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +26: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 8: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 8: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 8: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 8: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 8: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 9: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 9: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 9: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 9: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 9: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +18: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 8: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 8: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +24: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 9: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 9: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +25: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 8: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +18: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +18: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 9: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 9: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 8: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 9: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 9: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +24: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 9: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +10: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +10: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 8: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 8: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 8: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 8: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 8: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +24: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +24: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +18: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +18: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +26: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 9: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 9: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 8: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +15: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +15: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +15: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +15: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +15: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 2: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 2: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 2: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 2: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +18: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +26: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +25: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 2: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 2: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 2: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +10: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +26: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 8: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 2: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 7: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 7: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 2: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 2: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 2: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +18: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 9: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 2: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 2: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 2: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +15: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +26: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +15: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +15: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +24: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +15: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +18: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 3: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 3: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 3: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 3: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 3: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +10: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +15: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +15: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +15: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 9: [2023-05-13 01:00:02,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 2: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +10: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +15: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +10: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 3: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 3: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 7: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +25: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +26: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 3: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 3: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 3: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 3: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 3: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +18: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +18: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +10: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 3: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 3: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +15: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 7: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +10: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +10: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +26: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +26: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 3: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +18: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +28: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +28: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +28: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +28: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +25: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 1: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 1: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 1: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +10: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +18: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +25: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 1: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 1: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 7: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 7: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +10: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 3: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 5: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 5: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 5: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 1: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 1: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +26: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +28: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +28: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +25: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 7: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 7: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +28: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +28: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +28: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 1: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 1: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +26: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +26: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +25: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 5: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 5: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 5: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 5: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +23: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +23: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +26: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +25: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 1: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 1: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 5: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 5: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 5: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 5: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 1: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +27: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 5: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 5: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 5: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 1: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 1: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +10: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +23: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +23: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 6: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 6: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 6: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 6: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 6: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +17: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +17: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +17: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +17: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +17: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +29: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +29: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +29: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +29: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +29: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +25: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 1: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +11: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +11: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +11: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +23: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 7: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 7: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +26: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +14: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +14: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 6: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +25: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +11: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +11: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +11: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +11: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +29: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +29: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 6: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +17: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +17: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +10: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +29: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +29: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +29: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +25: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 1: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +29: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +28: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 6: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 6: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 6: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 6: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +11: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +11: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +11: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +11: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +11: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 6: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +17: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +17: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +17: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +17: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 6: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 6: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +17: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +17: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +11: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +11: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +29: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +29: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +29: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +25: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +17: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +28: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +23: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +14: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 7: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 7: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +23: [2023-05-13 01:00:02,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +25: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 7: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +25: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +14: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +13: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +13: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +13: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +13: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +13: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +13: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +13: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +25: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 7: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +14: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +23: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +16: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +13: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +13: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +13: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +13: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +13: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +25: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +13: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +13: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +14: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +14: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +27: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +23: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +14: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 7: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +14: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +14: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +14: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +14: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +16: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +14: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +14: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +16: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +14: [2023-05-13 01:00:02,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +23: [2023-05-13 01:00:02,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +23: [2023-05-13 01:00:02,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +14: [2023-05-13 01:00:02,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +16: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +16: [2023-05-13 01:00:02,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +16: [2023-05-13 01:00:02,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +16: [2023-05-13 01:00:02,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:02,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +16: [2023-05-13 01:00:02,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +16: [2023-05-13 01:00:02,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +16: [2023-05-13 01:00:02,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +16: [2023-05-13 01:00:02,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 5: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +16: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +16: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +16: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +27: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +27: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +27: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +27: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 5: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +27: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +27: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +16: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +19: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +19: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +19: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 5: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +23: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +23: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +23: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +19: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +19: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +16: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 4: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 4: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 4: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 4: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 4: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +23: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 4: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +23: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +17: [2023-05-13 01:00:02,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +17: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +27: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +27: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +27: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +27: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +27: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 6: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 2: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +27: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +30: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +30: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +30: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +30: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +30: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +30: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 6: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 5: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +27: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +29: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 8: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 8: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 8: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +11: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 5: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +29: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 2: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +11: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... +13: [2023-05-13 01:00:02,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 2: [2023-05-13 01:00:02,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +19: [2023-05-13 01:00:02,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 4: [2023-05-13 01:00:02,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +27: [2023-05-13 01:00:02,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +13: [2023-05-13 01:00:02,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt... + 4: [2023-05-13 01:00:02,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 5: [2023-05-13 01:00:02,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:02,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:02,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +17: [2023-05-13 01:00:02,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 6: [2023-05-13 01:00:02,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 8: [2023-05-13 01:00:02,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 8: [2023-05-13 01:00:02,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 8: [2023-05-13 01:00:02,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 4: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 4: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 4: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 4: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 4: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 4: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 4: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 4: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 3: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 3: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 3: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 8: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 8: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 8: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 8: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +19: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 9: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 9: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 9: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 9: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +29: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 9: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 9: [2023-05-13 01:00:02,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 3: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 3: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 3: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +11: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +29: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 8: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 8: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 8: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 8: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +24: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +29: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 6: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +29: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +17: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +11: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 8: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 9: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 9: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 9: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 9: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 9: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 9: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 9: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 8: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 6: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 6: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +13: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 6: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +28: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 5: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +11: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +11: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 2: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 6: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +28: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +13: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +29: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +28: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 6: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 6: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +29: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +28: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 5: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 5: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +15: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 6: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 6: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 5: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +11: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +29: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +11: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +17: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +17: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +17: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +11: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 6: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +29: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 2: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 6: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +11: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +15: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +28: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +29: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 6: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +29: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +29: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 1: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +11: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +15: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +24: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +24: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 5: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 5: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 6: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 5: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 2: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +24: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +11: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +29: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +17: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 5: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 1: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 6: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +17: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +17: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +24: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +24: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +29: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 1: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +28: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:02,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +17: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +11: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +29: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +29: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +17: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 6: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +13: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 5: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +11: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +13: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 5: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +11: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +15: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +11: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +17: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +13: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 5: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +13: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +15: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +17: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +29: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +17: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 1: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 5: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +11: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +11: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +17: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 1: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 1: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +13: [2023-05-13 01:00:02,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 1: [2023-05-13 01:00:02,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +13: [2023-05-13 01:00:02,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +13: [2023-05-13 01:00:02,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +17: [2023-05-13 01:00:02,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 1: [2023-05-13 01:00:02,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 1: [2023-05-13 01:00:02,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +13: [2023-05-13 01:00:02,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +13: [2023-05-13 01:00:02,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:02,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 1: [2023-05-13 01:00:02,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 1: [2023-05-13 01:00:02,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. +13: [2023-05-13 01:00:02,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 1: [2023-05-13 01:00:02,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +17: [2023-05-13 01:00:02,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 1: [2023-05-13 01:00:02,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 1: [2023-05-13 01:00:02,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 1: [2023-05-13 01:00:02,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +13: [2023-05-13 01:00:02,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +13: [2023-05-13 01:00:02,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +13: [2023-05-13 01:00:02,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +13: [2023-05-13 01:00:02,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 1: [2023-05-13 01:00:02,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 3: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 9: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 3: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 3: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 3: [2023-05-13 01:00:02,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 9: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 3: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 9: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 3: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 3: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 3: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/mp_rank_00_model_states.pt. + 3: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 3: [2023-05-13 01:00:02,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 8: [2023-05-13 01:00:03,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 8: [2023-05-13 01:00:03,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +30: [2023-05-13 01:00:03,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +30: [2023-05-13 01:00:03,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 8: [2023-05-13 01:00:03,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 8: [2023-05-13 01:00:03,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 8: [2023-05-13 01:00:03,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 8: [2023-05-13 01:00:03,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 8: [2023-05-13 01:00:03,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 2: [2023-05-13 01:00:03,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 2: [2023-05-13 01:00:03,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 2: [2023-05-13 01:00:03,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 2: [2023-05-13 01:00:03,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 2: [2023-05-13 01:00:03,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 2: [2023-05-13 01:00:03,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 2: [2023-05-13 01:00:03,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +30: [2023-05-13 01:00:03,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +30: [2023-05-13 01:00:03,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +30: [2023-05-13 01:00:03,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +30: [2023-05-13 01:00:03,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 8: [2023-05-13 01:00:03,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +16: [2023-05-13 01:00:03,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +16: [2023-05-13 01:00:03,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 2: [2023-05-13 01:00:03,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +16: [2023-05-13 01:00:03,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +16: [2023-05-13 01:00:03,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +16: [2023-05-13 01:00:03,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +16: [2023-05-13 01:00:03,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +16: [2023-05-13 01:00:03,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +30: [2023-05-13 01:00:03,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +30: [2023-05-13 01:00:03,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +14: [2023-05-13 01:00:03,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +14: [2023-05-13 01:00:03,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +14: [2023-05-13 01:00:03,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +14: [2023-05-13 01:00:03,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +14: [2023-05-13 01:00:03,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +14: [2023-05-13 01:00:03,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +14: [2023-05-13 01:00:03,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +14: [2023-05-13 01:00:03,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +22: [2023-05-13 01:00:03,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +22: [2023-05-13 01:00:03,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +22: [2023-05-13 01:00:03,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +22: [2023-05-13 01:00:03,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +22: [2023-05-13 01:00:03,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +22: [2023-05-13 01:00:03,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +22: [2023-05-13 01:00:03,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +16: [2023-05-13 01:00:03,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +22: [2023-05-13 01:00:03,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +19: [2023-05-13 01:00:03,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +19: [2023-05-13 01:00:03,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 8: [2023-05-13 01:00:03,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:03,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +19: [2023-05-13 01:00:03,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +19: [2023-05-13 01:00:03,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +19: [2023-05-13 01:00:03,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +19: [2023-05-13 01:00:03,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 8: [2023-05-13 01:00:03,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:03,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +30: [2023-05-13 01:00:03,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:03,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:03,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:03,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:03,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +16: [2023-05-13 01:00:03,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +14: [2023-05-13 01:00:03,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +14: [2023-05-13 01:00:03,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +14: [2023-05-13 01:00:03,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +14: [2023-05-13 01:00:03,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 8: [2023-05-13 01:00:03,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:03,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 8: [2023-05-13 01:00:03,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:03,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:03,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +22: [2023-05-13 01:00:03,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:03,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 8: [2023-05-13 01:00:03,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:03,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:03,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +22: [2023-05-13 01:00:03,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +22: [2023-05-13 01:00:03,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 8: [2023-05-13 01:00:03,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +14: [2023-05-13 01:00:03,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 8: [2023-05-13 01:00:03,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +14: [2023-05-13 01:00:03,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 8: [2023-05-13 01:00:03,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +27: [2023-05-13 01:00:03,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +27: [2023-05-13 01:00:03,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +27: [2023-05-13 01:00:03,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +27: [2023-05-13 01:00:03,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +27: [2023-05-13 01:00:03,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +27: [2023-05-13 01:00:03,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +27: [2023-05-13 01:00:03,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +14: [2023-05-13 01:00:03,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +27: [2023-05-13 01:00:03,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +22: [2023-05-13 01:00:03,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +23: [2023-05-13 01:00:03,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +23: [2023-05-13 01:00:03,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +23: [2023-05-13 01:00:03,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +14: [2023-05-13 01:00:03,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +22: [2023-05-13 01:00:03,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +22: [2023-05-13 01:00:03,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +22: [2023-05-13 01:00:03,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +22: [2023-05-13 01:00:03,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +23: [2023-05-13 01:00:03,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +23: [2023-05-13 01:00:03,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +23: [2023-05-13 01:00:03,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +23: [2023-05-13 01:00:03,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +23: [2023-05-13 01:00:03,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +19: [2023-05-13 01:00:03,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +16: [2023-05-13 01:00:03,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +16: [2023-05-13 01:00:03,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:03,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:03,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:03,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +23: [2023-05-13 01:00:03,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +23: [2023-05-13 01:00:03,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +27: [2023-05-13 01:00:03,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:03,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +27: [2023-05-13 01:00:03,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +27: [2023-05-13 01:00:03,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +27: [2023-05-13 01:00:03,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +16: [2023-05-13 01:00:03,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +16: [2023-05-13 01:00:03,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +16: [2023-05-13 01:00:03,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +16: [2023-05-13 01:00:03,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:03,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:03,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:03,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:03,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +27: [2023-05-13 01:00:03,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +27: [2023-05-13 01:00:03,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +27: [2023-05-13 01:00:03,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:03,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +27: [2023-05-13 01:00:03,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +16: [2023-05-13 01:00:03,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:03,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:03,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +23: [2023-05-13 01:00:03,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:03,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +26: [2023-05-13 01:00:03,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +26: [2023-05-13 01:00:03,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +26: [2023-05-13 01:00:03,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +26: [2023-05-13 01:00:03,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +26: [2023-05-13 01:00:03,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +26: [2023-05-13 01:00:03,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +26: [2023-05-13 01:00:03,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +26: [2023-05-13 01:00:03,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +23: [2023-05-13 01:00:03,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +23: [2023-05-13 01:00:03,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +23: [2023-05-13 01:00:03,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +23: [2023-05-13 01:00:03,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +23: [2023-05-13 01:00:03,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +26: [2023-05-13 01:00:03,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +26: [2023-05-13 01:00:03,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +26: [2023-05-13 01:00:03,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +26: [2023-05-13 01:00:03,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +26: [2023-05-13 01:00:03,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +26: [2023-05-13 01:00:03,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +26: [2023-05-13 01:00:03,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +26: [2023-05-13 01:00:03,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +20: [2023-05-13 01:00:03,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 1: [2023-05-13 01:00:03,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 1: [2023-05-13 01:00:03,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +20: [2023-05-13 01:00:03,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 5: [2023-05-13 01:00:03,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 5: [2023-05-13 01:00:03,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 5: [2023-05-13 01:00:03,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 5: [2023-05-13 01:00:03,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 5: [2023-05-13 01:00:03,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 5: [2023-05-13 01:00:03,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 5: [2023-05-13 01:00:03,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 5: [2023-05-13 01:00:03,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 1: [2023-05-13 01:00:03,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 1: [2023-05-13 01:00:03,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 1: [2023-05-13 01:00:03,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 1: [2023-05-13 01:00:03,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 1: [2023-05-13 01:00:03,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +20: [2023-05-13 01:00:03,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +20: [2023-05-13 01:00:03,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +20: [2023-05-13 01:00:03,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +20: [2023-05-13 01:00:03,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +20: [2023-05-13 01:00:03,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 1: [2023-05-13 01:00:03,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +20: [2023-05-13 01:00:03,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +24: [2023-05-13 01:00:03,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +15: [2023-05-13 01:00:03,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +15: [2023-05-13 01:00:03,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +15: [2023-05-13 01:00:03,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +15: [2023-05-13 01:00:03,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +15: [2023-05-13 01:00:03,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +11: [2023-05-13 01:00:03,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +11: [2023-05-13 01:00:03,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +11: [2023-05-13 01:00:03,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +11: [2023-05-13 01:00:03,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +11: [2023-05-13 01:00:03,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +11: [2023-05-13 01:00:03,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +11: [2023-05-13 01:00:03,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +15: [2023-05-13 01:00:03,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +15: [2023-05-13 01:00:03,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +15: [2023-05-13 01:00:03,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +24: [2023-05-13 01:00:03,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +11: [2023-05-13 01:00:03,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +24: [2023-05-13 01:00:03,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +24: [2023-05-13 01:00:03,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +24: [2023-05-13 01:00:03,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +24: [2023-05-13 01:00:03,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +24: [2023-05-13 01:00:03,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +24: [2023-05-13 01:00:03,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 7: [2023-05-13 01:00:03,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 7: [2023-05-13 01:00:03,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 7: [2023-05-13 01:00:03,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 7: [2023-05-13 01:00:03,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 7: [2023-05-13 01:00:03,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 7: [2023-05-13 01:00:03,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 7: [2023-05-13 01:00:03,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 7: [2023-05-13 01:00:03,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +20: [2023-05-13 01:00:03,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +18: [2023-05-13 01:00:03,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +18: [2023-05-13 01:00:03,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +18: [2023-05-13 01:00:03,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +18: [2023-05-13 01:00:03,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +18: [2023-05-13 01:00:03,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 5: [2023-05-13 01:00:03,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 5: [2023-05-13 01:00:03,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 5: [2023-05-13 01:00:03,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +18: [2023-05-13 01:00:03,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +18: [2023-05-13 01:00:03,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 1: [2023-05-13 01:00:03,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +18: [2023-05-13 01:00:03,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 1: [2023-05-13 01:00:03,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 5: [2023-05-13 01:00:03,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 5: [2023-05-13 01:00:03,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:03,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 5: [2023-05-13 01:00:03,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:03,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 5: [2023-05-13 01:00:03,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 5: [2023-05-13 01:00:03,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +24: [2023-05-13 01:00:03,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +11: [2023-05-13 01:00:03,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +11: [2023-05-13 01:00:03,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +24: [2023-05-13 01:00:03,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 7: [2023-05-13 01:00:03,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +11: [2023-05-13 01:00:03,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 7: [2023-05-13 01:00:03,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 7: [2023-05-13 01:00:03,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +31: [2023-05-13 01:00:03,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +31: [2023-05-13 01:00:03,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +31: [2023-05-13 01:00:03,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +31: [2023-05-13 01:00:03,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +31: [2023-05-13 01:00:03,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +31: [2023-05-13 01:00:03,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +31: [2023-05-13 01:00:03,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 7: [2023-05-13 01:00:03,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +11: [2023-05-13 01:00:03,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +29: [2023-05-13 01:00:03,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +29: [2023-05-13 01:00:03,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +29: [2023-05-13 01:00:03,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +29: [2023-05-13 01:00:03,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +29: [2023-05-13 01:00:03,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +29: [2023-05-13 01:00:03,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +29: [2023-05-13 01:00:03,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +29: [2023-05-13 01:00:03,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +11: [2023-05-13 01:00:03,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 7: [2023-05-13 01:00:03,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +11: [2023-05-13 01:00:03,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +11: [2023-05-13 01:00:03,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +11: [2023-05-13 01:00:03,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 7: [2023-05-13 01:00:03,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 7: [2023-05-13 01:00:03,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +25: [2023-05-13 01:00:03,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +25: [2023-05-13 01:00:03,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +25: [2023-05-13 01:00:03,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +25: [2023-05-13 01:00:03,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +25: [2023-05-13 01:00:03,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +25: [2023-05-13 01:00:03,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +25: [2023-05-13 01:00:03,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 7: [2023-05-13 01:00:03,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +20: [2023-05-13 01:00:03,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +20: [2023-05-13 01:00:03,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:03,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +20: [2023-05-13 01:00:03,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +24: [2023-05-13 01:00:03,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +20: [2023-05-13 01:00:03,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:03,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +20: [2023-05-13 01:00:03,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +18: [2023-05-13 01:00:03,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +18: [2023-05-13 01:00:03,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:03,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +20: [2023-05-13 01:00:03,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +24: [2023-05-13 01:00:03,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +24: [2023-05-13 01:00:03,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +18: [2023-05-13 01:00:03,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:03,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:03,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 1: [2023-05-13 01:00:03,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +20: [2023-05-13 01:00:03,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +24: [2023-05-13 01:00:03,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +15: [2023-05-13 01:00:03,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +24: [2023-05-13 01:00:03,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 1: [2023-05-13 01:00:03,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +24: [2023-05-13 01:00:03,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 1: [2023-05-13 01:00:03,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 8: [2023-05-13 01:00:03,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 1: [2023-05-13 01:00:03,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:03,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +30: [2023-05-13 01:00:03,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 1: [2023-05-13 01:00:03,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +18: [2023-05-13 01:00:03,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 1: [2023-05-13 01:00:03,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +25: [2023-05-13 01:00:03,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +18: [2023-05-13 01:00:03,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 8: [2023-05-13 01:00:03,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +31: [2023-05-13 01:00:03,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +18: [2023-05-13 01:00:03,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +18: [2023-05-13 01:00:03,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +18: [2023-05-13 01:00:03,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +25: [2023-05-13 01:00:03,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +31: [2023-05-13 01:00:03,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +31: [2023-05-13 01:00:03,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 9: [2023-05-13 01:00:03,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 9: [2023-05-13 01:00:03,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 9: [2023-05-13 01:00:03,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 9: [2023-05-13 01:00:03,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 9: [2023-05-13 01:00:03,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 9: [2023-05-13 01:00:03,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 9: [2023-05-13 01:00:03,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +19: [2023-05-13 01:00:03,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +28: [2023-05-13 01:00:03,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +28: [2023-05-13 01:00:03,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +28: [2023-05-13 01:00:03,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +28: [2023-05-13 01:00:03,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +28: [2023-05-13 01:00:03,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +28: [2023-05-13 01:00:03,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +28: [2023-05-13 01:00:03,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +29: [2023-05-13 01:00:03,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 9: [2023-05-13 01:00:03,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +29: [2023-05-13 01:00:03,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +29: [2023-05-13 01:00:03,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +29: [2023-05-13 01:00:03,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +29: [2023-05-13 01:00:03,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +29: [2023-05-13 01:00:03,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:03,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +29: [2023-05-13 01:00:03,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +31: [2023-05-13 01:00:03,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +29: [2023-05-13 01:00:03,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +22: [2023-05-13 01:00:03,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +31: [2023-05-13 01:00:03,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +31: [2023-05-13 01:00:03,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +31: [2023-05-13 01:00:03,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +31: [2023-05-13 01:00:03,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +22: [2023-05-13 01:00:03,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +22: [2023-05-13 01:00:03,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +25: [2023-05-13 01:00:03,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +25: [2023-05-13 01:00:03,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +25: [2023-05-13 01:00:03,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +25: [2023-05-13 01:00:03,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +25: [2023-05-13 01:00:03,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:03,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +25: [2023-05-13 01:00:03,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +14: [2023-05-13 01:00:03,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +14: [2023-05-13 01:00:03,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +14: [2023-05-13 01:00:03,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 2: [2023-05-13 01:00:03,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 2: [2023-05-13 01:00:03,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +31: [2023-05-13 01:00:03,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 9: [2023-05-13 01:00:03,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 9: [2023-05-13 01:00:03,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 9: [2023-05-13 01:00:03,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +12: [2023-05-13 01:00:03,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +12: [2023-05-13 01:00:03,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +12: [2023-05-13 01:00:03,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +12: [2023-05-13 01:00:03,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +12: [2023-05-13 01:00:03,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +12: [2023-05-13 01:00:03,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +12: [2023-05-13 01:00:03,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +12: [2023-05-13 01:00:03,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +23: [2023-05-13 01:00:03,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +28: [2023-05-13 01:00:03,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:03,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:03,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:03,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:03,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:03,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:03,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +14: [2023-05-13 01:00:03,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +14: [2023-05-13 01:00:03,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +25: [2023-05-13 01:00:03,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +23: [2023-05-13 01:00:03,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 9: [2023-05-13 01:00:03,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 9: [2023-05-13 01:00:03,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 9: [2023-05-13 01:00:03,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +28: [2023-05-13 01:00:03,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +14: [2023-05-13 01:00:03,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +14: [2023-05-13 01:00:03,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +12: [2023-05-13 01:00:03,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 9: [2023-05-13 01:00:03,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 9: [2023-05-13 01:00:03,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +14: [2023-05-13 01:00:03,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +27: [2023-05-13 01:00:03,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +27: [2023-05-13 01:00:03,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +27: [2023-05-13 01:00:03,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +27: [2023-05-13 01:00:03,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 2: [2023-05-13 01:00:03,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 2: [2023-05-13 01:00:03,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 2: [2023-05-13 01:00:03,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +22: [2023-05-13 01:00:03,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +22: [2023-05-13 01:00:03,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +22: [2023-05-13 01:00:03,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +22: [2023-05-13 01:00:03,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +22: [2023-05-13 01:00:03,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +27: [2023-05-13 01:00:03,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +27: [2023-05-13 01:00:03,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +17: [2023-05-13 01:00:03,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +17: [2023-05-13 01:00:03,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +17: [2023-05-13 01:00:03,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +17: [2023-05-13 01:00:03,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +17: [2023-05-13 01:00:03,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +17: [2023-05-13 01:00:03,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +17: [2023-05-13 01:00:03,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +17: [2023-05-13 01:00:03,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +27: [2023-05-13 01:00:03,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +30: [2023-05-13 01:00:03,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 8: [2023-05-13 01:00:03,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +27: [2023-05-13 01:00:03,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +10: [2023-05-13 01:00:03,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +10: [2023-05-13 01:00:03,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +10: [2023-05-13 01:00:03,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +10: [2023-05-13 01:00:03,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +10: [2023-05-13 01:00:03,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +10: [2023-05-13 01:00:03,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +10: [2023-05-13 01:00:03,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 8: [2023-05-13 01:00:03,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 8: [2023-05-13 01:00:03,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 8: [2023-05-13 01:00:03,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +10: [2023-05-13 01:00:03,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 8: [2023-05-13 01:00:03,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 8: [2023-05-13 01:00:03,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 8: [2023-05-13 01:00:03,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +12: [2023-05-13 01:00:03,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +12: [2023-05-13 01:00:03,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +12: [2023-05-13 01:00:03,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +12: [2023-05-13 01:00:03,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:03,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +30: [2023-05-13 01:00:03,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:03,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +12: [2023-05-13 01:00:03,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +12: [2023-05-13 01:00:03,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:03,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +26: [2023-05-13 01:00:03,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 8: [2023-05-13 01:00:03,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +26: [2023-05-13 01:00:03,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +30: [2023-05-13 01:00:03,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +30: [2023-05-13 01:00:03,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +30: [2023-05-13 01:00:03,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +17: [2023-05-13 01:00:03,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 6: [2023-05-13 01:00:03,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +17: [2023-05-13 01:00:03,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:03,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 6: [2023-05-13 01:00:03,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 6: [2023-05-13 01:00:03,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 6: [2023-05-13 01:00:03,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 6: [2023-05-13 01:00:03,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 6: [2023-05-13 01:00:03,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 6: [2023-05-13 01:00:03,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 6: [2023-05-13 01:00:03,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +22: [2023-05-13 01:00:03,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +22: [2023-05-13 01:00:03,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +13: [2023-05-13 01:00:03,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +13: [2023-05-13 01:00:03,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +13: [2023-05-13 01:00:03,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +13: [2023-05-13 01:00:03,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +13: [2023-05-13 01:00:03,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +13: [2023-05-13 01:00:03,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +13: [2023-05-13 01:00:03,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +22: [2023-05-13 01:00:03,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +13: [2023-05-13 01:00:03,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +10: [2023-05-13 01:00:03,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +10: [2023-05-13 01:00:03,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +10: [2023-05-13 01:00:03,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +10: [2023-05-13 01:00:03,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +10: [2023-05-13 01:00:03,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +10: [2023-05-13 01:00:03,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +10: [2023-05-13 01:00:03,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +16: [2023-05-13 01:00:03,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +30: [2023-05-13 01:00:03,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +30: [2023-05-13 01:00:03,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +10: [2023-05-13 01:00:03,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +17: [2023-05-13 01:00:03,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +17: [2023-05-13 01:00:03,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:03,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +17: [2023-05-13 01:00:03,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +17: [2023-05-13 01:00:03,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +23: [2023-05-13 01:00:03,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +17: [2023-05-13 01:00:03,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +14: [2023-05-13 01:00:03,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +17: [2023-05-13 01:00:03,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +23: [2023-05-13 01:00:03,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +23: [2023-05-13 01:00:03,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +19: [2023-05-13 01:00:03,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +14: [2023-05-13 01:00:03,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +14: [2023-05-13 01:00:03,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +19: [2023-05-13 01:00:03,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +19: [2023-05-13 01:00:03,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +14: [2023-05-13 01:00:03,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +16: [2023-05-13 01:00:03,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +16: [2023-05-13 01:00:03,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 6: [2023-05-13 01:00:03,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 6: [2023-05-13 01:00:03,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 6: [2023-05-13 01:00:03,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +16: [2023-05-13 01:00:03,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 6: [2023-05-13 01:00:03,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 6: [2023-05-13 01:00:03,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 6: [2023-05-13 01:00:03,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +13: [2023-05-13 01:00:03,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +21: [2023-05-13 01:00:03,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 6: [2023-05-13 01:00:03,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +13: [2023-05-13 01:00:03,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +21: [2023-05-13 01:00:03,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +21: [2023-05-13 01:00:03,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +21: [2023-05-13 01:00:03,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +21: [2023-05-13 01:00:03,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +21: [2023-05-13 01:00:03,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +21: [2023-05-13 01:00:03,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 6: [2023-05-13 01:00:03,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +13: [2023-05-13 01:00:03,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +21: [2023-05-13 01:00:03,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 0: [2023-05-13 01:00:03,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +23: [2023-05-13 01:00:03,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +23: [2023-05-13 01:00:03,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +23: [2023-05-13 01:00:03,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +23: [2023-05-13 01:00:03,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 0: [2023-05-13 01:00:03,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 0: [2023-05-13 01:00:03,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 0: [2023-05-13 01:00:03,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +23: [2023-05-13 01:00:03,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 0: [2023-05-13 01:00:03,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 0: [2023-05-13 01:00:03,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 0: [2023-05-13 01:00:03,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 0: [2023-05-13 01:00:03,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +14: [2023-05-13 01:00:03,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +14: [2023-05-13 01:00:03,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +14: [2023-05-13 01:00:03,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +14: [2023-05-13 01:00:03,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +27: [2023-05-13 01:00:03,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +13: [2023-05-13 01:00:03,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +13: [2023-05-13 01:00:03,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +22: [2023-05-13 01:00:03,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +13: [2023-05-13 01:00:03,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +13: [2023-05-13 01:00:03,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +13: [2023-05-13 01:00:03,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 4: [2023-05-13 01:00:03,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 3: [2023-05-13 01:00:03,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 3: [2023-05-13 01:00:03,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 3: [2023-05-13 01:00:03,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 3: [2023-05-13 01:00:03,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 3: [2023-05-13 01:00:03,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 3: [2023-05-13 01:00:03,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 3: [2023-05-13 01:00:03,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +22: [2023-05-13 01:00:03,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 4: [2023-05-13 01:00:03,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 4: [2023-05-13 01:00:03,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 4: [2023-05-13 01:00:03,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 3: [2023-05-13 01:00:03,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 0: [2023-05-13 01:00:03,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +27: [2023-05-13 01:00:03,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:03,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +21: [2023-05-13 01:00:03,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +22: [2023-05-13 01:00:03,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +27: [2023-05-13 01:00:03,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 2: [2023-05-13 01:00:03,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:03,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:03,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 0: [2023-05-13 01:00:03,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +21: [2023-05-13 01:00:03,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +21: [2023-05-13 01:00:03,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +21: [2023-05-13 01:00:03,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +26: [2023-05-13 01:00:03,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +26: [2023-05-13 01:00:03,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +26: [2023-05-13 01:00:03,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +26: [2023-05-13 01:00:03,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +26: [2023-05-13 01:00:03,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 2: [2023-05-13 01:00:03,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 2: [2023-05-13 01:00:03,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +27: [2023-05-13 01:00:03,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +22: [2023-05-13 01:00:03,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +22: [2023-05-13 01:00:03,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +27: [2023-05-13 01:00:03,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +20: [2023-05-13 01:00:03,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +21: [2023-05-13 01:00:03,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 0: [2023-05-13 01:00:03,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +21: [2023-05-13 01:00:03,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +16: [2023-05-13 01:00:03,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +27: [2023-05-13 01:00:03,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 0: [2023-05-13 01:00:03,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 0: [2023-05-13 01:00:03,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 3: [2023-05-13 01:00:03,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 3: [2023-05-13 01:00:03,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +27: [2023-05-13 01:00:03,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 3: [2023-05-13 01:00:03,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 0: [2023-05-13 01:00:03,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 0: [2023-05-13 01:00:03,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 0: [2023-05-13 01:00:03,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +16: [2023-05-13 01:00:03,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +16: [2023-05-13 01:00:03,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +16: [2023-05-13 01:00:03,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +30: [2023-05-13 01:00:03,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 2: [2023-05-13 01:00:03,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 1: [2023-05-13 01:00:03,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 1: [2023-05-13 01:00:03,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +27: [2023-05-13 01:00:03,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 8: [2023-05-13 01:00:03,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 3: [2023-05-13 01:00:03,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +19: [2023-05-13 01:00:03,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +19: [2023-05-13 01:00:03,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +19: [2023-05-13 01:00:03,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +19: [2023-05-13 01:00:03,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 3: [2023-05-13 01:00:03,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 3: [2023-05-13 01:00:03,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... +30: [2023-05-13 01:00:03,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:03,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 5: [2023-05-13 01:00:03,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 5: [2023-05-13 01:00:03,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 4: [2023-05-13 01:00:03,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 3: [2023-05-13 01:00:03,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 3: [2023-05-13 01:00:03,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt... + 2: [2023-05-13 01:00:03,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 8: [2023-05-13 01:00:03,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +26: [2023-05-13 01:00:03,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 8: [2023-05-13 01:00:03,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +26: [2023-05-13 01:00:03,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +24: [2023-05-13 01:00:03,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 8: [2023-05-13 01:00:03,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +11: [2023-05-13 01:00:03,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +11: [2023-05-13 01:00:03,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 8: [2023-05-13 01:00:03,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +24: [2023-05-13 01:00:03,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 8: [2023-05-13 01:00:03,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +19: [2023-05-13 01:00:03,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +30: [2023-05-13 01:00:03,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +19: [2023-05-13 01:00:03,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +30: [2023-05-13 01:00:03,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +26: [2023-05-13 01:00:03,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +11: [2023-05-13 01:00:03,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 2: [2023-05-13 01:00:03,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 2: [2023-05-13 01:00:03,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +30: [2023-05-13 01:00:03,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +30: [2023-05-13 01:00:03,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +16: [2023-05-13 01:00:03,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 7: [2023-05-13 01:00:03,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +19: [2023-05-13 01:00:03,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 7: [2023-05-13 01:00:03,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 7: [2023-05-13 01:00:03,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 7: [2023-05-13 01:00:03,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +25: [2023-05-13 01:00:03,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +15: [2023-05-13 01:00:03,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +15: [2023-05-13 01:00:03,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +18: [2023-05-13 01:00:03,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +18: [2023-05-13 01:00:03,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +23: [2023-05-13 01:00:03,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +23: [2023-05-13 01:00:03,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 7: [2023-05-13 01:00:03,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +23: [2023-05-13 01:00:03,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:03,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 5: [2023-05-13 01:00:03,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 5: [2023-05-13 01:00:03,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +16: [2023-05-13 01:00:03,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:03,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 7: [2023-05-13 01:00:03,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +25: [2023-05-13 01:00:03,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 7: [2023-05-13 01:00:03,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +16: [2023-05-13 01:00:03,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +18: [2023-05-13 01:00:03,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 5: [2023-05-13 01:00:03,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +16: [2023-05-13 01:00:03,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +23: [2023-05-13 01:00:03,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +31: [2023-05-13 01:00:03,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 7: [2023-05-13 01:00:03,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +31: [2023-05-13 01:00:03,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +31: [2023-05-13 01:00:03,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +11: [2023-05-13 01:00:03,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +23: [2023-05-13 01:00:03,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 9: [2023-05-13 01:00:03,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 9: [2023-05-13 01:00:03,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 9: [2023-05-13 01:00:03,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +23: [2023-05-13 01:00:03,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +29: [2023-05-13 01:00:03,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +11: [2023-05-13 01:00:03,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +11: [2023-05-13 01:00:03,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +11: [2023-05-13 01:00:03,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +11: [2023-05-13 01:00:03,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +26: [2023-05-13 01:00:03,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +20: [2023-05-13 01:00:03,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:03,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +31: [2023-05-13 01:00:03,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +31: [2023-05-13 01:00:03,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 1: [2023-05-13 01:00:03,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 1: [2023-05-13 01:00:03,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +18: [2023-05-13 01:00:03,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +18: [2023-05-13 01:00:03,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +29: [2023-05-13 01:00:03,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +29: [2023-05-13 01:00:03,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +31: [2023-05-13 01:00:03,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +29: [2023-05-13 01:00:03,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +29: [2023-05-13 01:00:03,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +31: [2023-05-13 01:00:03,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +29: [2023-05-13 01:00:03,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +29: [2023-05-13 01:00:03,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +16: [2023-05-13 01:00:03,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +26: [2023-05-13 01:00:03,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +24: [2023-05-13 01:00:03,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +24: [2023-05-13 01:00:03,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +24: [2023-05-13 01:00:03,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +24: [2023-05-13 01:00:03,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +28: [2023-05-13 01:00:03,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +28: [2023-05-13 01:00:03,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +19: [2023-05-13 01:00:03,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +28: [2023-05-13 01:00:03,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +15: [2023-05-13 01:00:03,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +15: [2023-05-13 01:00:03,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +15: [2023-05-13 01:00:03,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +11: [2023-05-13 01:00:03,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +15: [2023-05-13 01:00:03,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +18: [2023-05-13 01:00:03,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +18: [2023-05-13 01:00:03,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +18: [2023-05-13 01:00:03,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +31: [2023-05-13 01:00:03,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +15: [2023-05-13 01:00:03,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +15: [2023-05-13 01:00:03,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 1: [2023-05-13 01:00:03,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 1: [2023-05-13 01:00:03,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 1: [2023-05-13 01:00:03,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +19: [2023-05-13 01:00:03,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 1: [2023-05-13 01:00:03,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +19: [2023-05-13 01:00:03,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +11: [2023-05-13 01:00:03,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +19: [2023-05-13 01:00:03,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +16: [2023-05-13 01:00:03,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +26: [2023-05-13 01:00:03,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +26: [2023-05-13 01:00:03,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +26: [2023-05-13 01:00:03,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +29: [2023-05-13 01:00:03,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +20: [2023-05-13 01:00:03,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +24: [2023-05-13 01:00:03,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:03,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:03,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +24: [2023-05-13 01:00:03,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +11: [2023-05-13 01:00:03,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +20: [2023-05-13 01:00:03,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +20: [2023-05-13 01:00:03,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +26: [2023-05-13 01:00:03,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +20: [2023-05-13 01:00:03,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 9: [2023-05-13 01:00:03,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 9: [2023-05-13 01:00:03,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 9: [2023-05-13 01:00:03,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 1: [2023-05-13 01:00:03,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +16: [2023-05-13 01:00:03,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +25: [2023-05-13 01:00:03,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:03,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +16: [2023-05-13 01:00:03,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +28: [2023-05-13 01:00:03,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +28: [2023-05-13 01:00:03,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +28: [2023-05-13 01:00:03,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +28: [2023-05-13 01:00:03,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +25: [2023-05-13 01:00:03,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +25: [2023-05-13 01:00:03,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +25: [2023-05-13 01:00:03,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 7: [2023-05-13 01:00:03,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 1: [2023-05-13 01:00:03,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 7: [2023-05-13 01:00:03,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +25: [2023-05-13 01:00:03,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +25: [2023-05-13 01:00:03,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +18: [2023-05-13 01:00:03,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +25: [2023-05-13 01:00:03,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +17: [2023-05-13 01:00:03,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +17: [2023-05-13 01:00:03,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +18: [2023-05-13 01:00:03,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +24: [2023-05-13 01:00:03,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 7: [2023-05-13 01:00:03,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +24: [2023-05-13 01:00:03,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 5: [2023-05-13 01:00:03,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +28: [2023-05-13 01:00:03,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +20: [2023-05-13 01:00:03,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +20: [2023-05-13 01:00:03,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +20: [2023-05-13 01:00:03,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 5: [2023-05-13 01:00:03,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +18: [2023-05-13 01:00:03,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 9: [2023-05-13 01:00:03,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 5: [2023-05-13 01:00:03,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 9: [2023-05-13 01:00:03,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 5: [2023-05-13 01:00:03,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:03,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +31: [2023-05-13 01:00:03,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 9: [2023-05-13 01:00:03,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 9: [2023-05-13 01:00:03,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 9: [2023-05-13 01:00:03,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +31: [2023-05-13 01:00:03,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +31: [2023-05-13 01:00:03,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:03,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 7: [2023-05-13 01:00:03,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 7: [2023-05-13 01:00:03,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 7: [2023-05-13 01:00:03,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 7: [2023-05-13 01:00:03,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 7: [2023-05-13 01:00:03,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +11: [2023-05-13 01:00:03,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +10: [2023-05-13 01:00:03,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +10: [2023-05-13 01:00:03,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +10: [2023-05-13 01:00:03,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +11: [2023-05-13 01:00:03,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +29: [2023-05-13 01:00:03,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +24: [2023-05-13 01:00:03,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +11: [2023-05-13 01:00:03,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +13: [2023-05-13 01:00:03,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +13: [2023-05-13 01:00:03,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 6: [2023-05-13 01:00:03,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +13: [2023-05-13 01:00:03,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 6: [2023-05-13 01:00:03,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +31: [2023-05-13 01:00:03,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +31: [2023-05-13 01:00:03,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +25: [2023-05-13 01:00:03,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +18: [2023-05-13 01:00:03,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +31: [2023-05-13 01:00:03,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +15: [2023-05-13 01:00:03,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +11: [2023-05-13 01:00:03,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +11: [2023-05-13 01:00:03,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +10: [2023-05-13 01:00:03,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +10: [2023-05-13 01:00:03,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +10: [2023-05-13 01:00:03,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +10: [2023-05-13 01:00:03,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +18: [2023-05-13 01:00:03,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +29: [2023-05-13 01:00:03,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +31: [2023-05-13 01:00:03,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +29: [2023-05-13 01:00:03,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +15: [2023-05-13 01:00:03,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 1: [2023-05-13 01:00:03,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +28: [2023-05-13 01:00:03,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +24: [2023-05-13 01:00:03,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +31: [2023-05-13 01:00:03,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +18: [2023-05-13 01:00:03,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 9: [2023-05-13 01:00:03,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 1: [2023-05-13 01:00:03,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +29: [2023-05-13 01:00:03,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +29: [2023-05-13 01:00:03,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:03,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +29: [2023-05-13 01:00:03,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:03,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +18: [2023-05-13 01:00:03,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 6: [2023-05-13 01:00:03,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 6: [2023-05-13 01:00:03,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +10: [2023-05-13 01:00:03,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +18: [2023-05-13 01:00:03,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 6: [2023-05-13 01:00:03,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 1: [2023-05-13 01:00:03,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 6: [2023-05-13 01:00:03,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +21: [2023-05-13 01:00:03,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 9: [2023-05-13 01:00:03,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:03,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +28: [2023-05-13 01:00:03,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:03,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +12: [2023-05-13 01:00:03,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +12: [2023-05-13 01:00:03,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +28: [2023-05-13 01:00:03,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +29: [2023-05-13 01:00:03,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +20: [2023-05-13 01:00:03,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 1: [2023-05-13 01:00:03,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +20: [2023-05-13 01:00:03,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +24: [2023-05-13 01:00:03,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:03,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +24: [2023-05-13 01:00:03,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 1: [2023-05-13 01:00:03,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +17: [2023-05-13 01:00:03,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +29: [2023-05-13 01:00:03,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:03,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 6: [2023-05-13 01:00:03,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 6: [2023-05-13 01:00:03,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +17: [2023-05-13 01:00:03,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +25: [2023-05-13 01:00:03,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:03,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +24: [2023-05-13 01:00:03,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +15: [2023-05-13 01:00:03,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 9: [2023-05-13 01:00:03,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +15: [2023-05-13 01:00:03,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 0: [2023-05-13 01:00:03,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +15: [2023-05-13 01:00:03,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 1: [2023-05-13 01:00:03,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 3: [2023-05-13 01:00:03,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 3: [2023-05-13 01:00:03,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 3: [2023-05-13 01:00:03,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +15: [2023-05-13 01:00:03,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +25: [2023-05-13 01:00:03,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 0: [2023-05-13 01:00:03,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +15: [2023-05-13 01:00:03,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +15: [2023-05-13 01:00:03,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +20: [2023-05-13 01:00:03,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +13: [2023-05-13 01:00:03,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +17: [2023-05-13 01:00:03,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +17: [2023-05-13 01:00:03,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +17: [2023-05-13 01:00:03,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +13: [2023-05-13 01:00:03,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 9: [2023-05-13 01:00:03,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +28: [2023-05-13 01:00:03,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +25: [2023-05-13 01:00:03,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +24: [2023-05-13 01:00:03,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +17: [2023-05-13 01:00:03,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +17: [2023-05-13 01:00:03,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +28: [2023-05-13 01:00:03,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +20: [2023-05-13 01:00:03,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +25: [2023-05-13 01:00:03,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +28: [2023-05-13 01:00:03,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 9: [2023-05-13 01:00:03,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +28: [2023-05-13 01:00:03,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +25: [2023-05-13 01:00:03,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:03,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +21: [2023-05-13 01:00:03,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +20: [2023-05-13 01:00:03,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:03,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +28: [2023-05-13 01:00:03,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 4: [2023-05-13 01:00:03,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 4: [2023-05-13 01:00:03,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +10: [2023-05-13 01:00:03,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +13: [2023-05-13 01:00:03,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +13: [2023-05-13 01:00:03,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +20: [2023-05-13 01:00:03,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +13: [2023-05-13 01:00:03,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +20: [2023-05-13 01:00:03,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 6: [2023-05-13 01:00:03,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +10: [2023-05-13 01:00:03,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +25: [2023-05-13 01:00:03,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +10: [2023-05-13 01:00:03,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 6: [2023-05-13 01:00:03,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:03,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +21: [2023-05-13 01:00:03,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +17: [2023-05-13 01:00:03,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 3: [2023-05-13 01:00:03,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 3: [2023-05-13 01:00:03,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 3: [2023-05-13 01:00:03,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 3: [2023-05-13 01:00:03,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 3: [2023-05-13 01:00:03,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +10: [2023-05-13 01:00:03,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +13: [2023-05-13 01:00:03,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +10: [2023-05-13 01:00:03,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 4: [2023-05-13 01:00:03,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 4: [2023-05-13 01:00:03,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 4: [2023-05-13 01:00:03,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 4: [2023-05-13 01:00:03,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. +13: [2023-05-13 01:00:03,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 6: [2023-05-13 01:00:03,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 0: [2023-05-13 01:00:03,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 0: [2023-05-13 01:00:03,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 0: [2023-05-13 01:00:03,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 0: [2023-05-13 01:00:03,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 6: [2023-05-13 01:00:03,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 6: [2023-05-13 01:00:03,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +13: [2023-05-13 01:00:03,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 0: [2023-05-13 01:00:03,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 6: [2023-05-13 01:00:03,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +10: [2023-05-13 01:00:03,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 3: [2023-05-13 01:00:03,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 6: [2023-05-13 01:00:03,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 6: [2023-05-13 01:00:03,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 3: [2023-05-13 01:00:03,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +10: [2023-05-13 01:00:03,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +10: [2023-05-13 01:00:03,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 3: [2023-05-13 01:00:03,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 0: [2023-05-13 01:00:03,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_01-model_00-model_states.pt. + 0: [2023-05-13 01:00:03,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:03,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:03,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:03,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:03,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:03,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:03,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +13: [2023-05-13 01:00:03,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 0: [2023-05-13 01:00:03,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +17: [2023-05-13 01:00:03,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +13: [2023-05-13 01:00:03,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:03,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +17: [2023-05-13 01:00:03,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +17: [2023-05-13 01:00:03,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:03,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:03,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:03,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:03,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +17: [2023-05-13 01:00:03,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +17: [2023-05-13 01:00:03,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:03,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +13: [2023-05-13 01:00:03,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:03,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:03,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:03,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +13: [2023-05-13 01:00:03,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 3: [2023-05-13 01:00:03,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +13: [2023-05-13 01:00:03,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 3: [2023-05-13 01:00:03,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +17: [2023-05-13 01:00:03,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 3: [2023-05-13 01:00:03,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 3: [2023-05-13 01:00:03,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 3: [2023-05-13 01:00:03,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 4: [2023-05-13 01:00:03,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 0: [2023-05-13 01:00:03,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 0: [2023-05-13 01:00:03,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 0: [2023-05-13 01:00:03,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 0: [2023-05-13 01:00:03,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 0: [2023-05-13 01:00:03,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 0: [2023-05-13 01:00:03,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +19: [2023-05-13 01:00:03,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +19: [2023-05-13 01:00:03,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +19: [2023-05-13 01:00:03,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +19: [2023-05-13 01:00:03,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +19: [2023-05-13 01:00:03,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +19: [2023-05-13 01:00:03,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +19: [2023-05-13 01:00:03,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +19: [2023-05-13 01:00:03,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +19: [2023-05-13 01:00:03,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +19: [2023-05-13 01:00:03,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +19: [2023-05-13 01:00:03,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +19: [2023-05-13 01:00:03,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +19: [2023-05-13 01:00:03,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +19: [2023-05-13 01:00:03,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +19: [2023-05-13 01:00:03,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +19: [2023-05-13 01:00:03,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +26: [2023-05-13 01:00:03,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +26: [2023-05-13 01:00:03,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +26: [2023-05-13 01:00:03,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +26: [2023-05-13 01:00:03,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +26: [2023-05-13 01:00:03,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +26: [2023-05-13 01:00:03,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +26: [2023-05-13 01:00:03,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +26: [2023-05-13 01:00:03,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +26: [2023-05-13 01:00:03,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +26: [2023-05-13 01:00:03,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +26: [2023-05-13 01:00:03,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +26: [2023-05-13 01:00:03,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +26: [2023-05-13 01:00:03,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +26: [2023-05-13 01:00:03,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +26: [2023-05-13 01:00:03,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +26: [2023-05-13 01:00:03,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +16: [2023-05-13 01:00:04,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +16: [2023-05-13 01:00:04,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +16: [2023-05-13 01:00:04,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +16: [2023-05-13 01:00:04,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +16: [2023-05-13 01:00:04,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +16: [2023-05-13 01:00:04,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +16: [2023-05-13 01:00:04,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +16: [2023-05-13 01:00:04,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +16: [2023-05-13 01:00:04,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +19: [2023-05-13 01:00:04,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +16: [2023-05-13 01:00:04,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +16: [2023-05-13 01:00:04,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +16: [2023-05-13 01:00:04,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +16: [2023-05-13 01:00:04,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +16: [2023-05-13 01:00:04,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +16: [2023-05-13 01:00:04,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +16: [2023-05-13 01:00:04,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +26: [2023-05-13 01:00:04,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +26: [2023-05-13 01:00:04,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +19: [2023-05-13 01:00:04,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +19: [2023-05-13 01:00:04,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +19: [2023-05-13 01:00:04,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +19: [2023-05-13 01:00:04,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +18: [2023-05-13 01:00:04,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +18: [2023-05-13 01:00:04,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +18: [2023-05-13 01:00:04,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +18: [2023-05-13 01:00:04,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +18: [2023-05-13 01:00:04,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +18: [2023-05-13 01:00:04,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +18: [2023-05-13 01:00:04,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +27: [2023-05-13 01:00:04,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +18: [2023-05-13 01:00:04,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +27: [2023-05-13 01:00:04,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +27: [2023-05-13 01:00:04,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +27: [2023-05-13 01:00:04,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +19: [2023-05-13 01:00:04,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +19: [2023-05-13 01:00:04,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +19: [2023-05-13 01:00:04,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +19: [2023-05-13 01:00:04,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +27: [2023-05-13 01:00:04,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +27: [2023-05-13 01:00:04,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +27: [2023-05-13 01:00:04,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +27: [2023-05-13 01:00:04,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +18: [2023-05-13 01:00:04,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +18: [2023-05-13 01:00:04,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +18: [2023-05-13 01:00:04,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +27: [2023-05-13 01:00:04,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +27: [2023-05-13 01:00:04,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +27: [2023-05-13 01:00:04,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +18: [2023-05-13 01:00:04,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +18: [2023-05-13 01:00:04,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +27: [2023-05-13 01:00:04,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +18: [2023-05-13 01:00:04,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +18: [2023-05-13 01:00:04,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +18: [2023-05-13 01:00:04,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +27: [2023-05-13 01:00:04,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +27: [2023-05-13 01:00:04,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +16: [2023-05-13 01:00:04,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +27: [2023-05-13 01:00:04,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +27: [2023-05-13 01:00:04,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +26: [2023-05-13 01:00:04,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +26: [2023-05-13 01:00:04,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +26: [2023-05-13 01:00:04,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +26: [2023-05-13 01:00:04,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +26: [2023-05-13 01:00:04,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +26: [2023-05-13 01:00:04,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +26: [2023-05-13 01:00:04,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +26: [2023-05-13 01:00:04,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +19: [2023-05-13 01:00:04,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +19: [2023-05-13 01:00:04,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +16: [2023-05-13 01:00:04,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +19: [2023-05-13 01:00:04,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +19: [2023-05-13 01:00:04,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +19: [2023-05-13 01:00:04,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +16: [2023-05-13 01:00:04,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +16: [2023-05-13 01:00:04,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +16: [2023-05-13 01:00:04,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +19: [2023-05-13 01:00:04,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +19: [2023-05-13 01:00:04,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +16: [2023-05-13 01:00:04,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +16: [2023-05-13 01:00:04,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +16: [2023-05-13 01:00:04,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +16: [2023-05-13 01:00:04,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +26: [2023-05-13 01:00:04,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +26: [2023-05-13 01:00:04,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +26: [2023-05-13 01:00:04,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +26: [2023-05-13 01:00:04,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +26: [2023-05-13 01:00:04,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +26: [2023-05-13 01:00:04,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +18: [2023-05-13 01:00:04,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +18: [2023-05-13 01:00:04,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +18: [2023-05-13 01:00:04,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +27: [2023-05-13 01:00:04,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +18: [2023-05-13 01:00:04,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +18: [2023-05-13 01:00:04,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +27: [2023-05-13 01:00:04,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +27: [2023-05-13 01:00:04,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +27: [2023-05-13 01:00:04,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +18: [2023-05-13 01:00:04,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +18: [2023-05-13 01:00:04,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +18: [2023-05-13 01:00:04,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +16: [2023-05-13 01:00:04,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +31: [2023-05-13 01:00:04,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +31: [2023-05-13 01:00:04,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +27: [2023-05-13 01:00:04,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +27: [2023-05-13 01:00:04,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +27: [2023-05-13 01:00:04,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +27: [2023-05-13 01:00:04,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +31: [2023-05-13 01:00:04,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +31: [2023-05-13 01:00:04,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +31: [2023-05-13 01:00:04,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +31: [2023-05-13 01:00:04,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +16: [2023-05-13 01:00:04,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +25: [2023-05-13 01:00:04,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +25: [2023-05-13 01:00:04,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +16: [2023-05-13 01:00:04,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +25: [2023-05-13 01:00:04,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +18: [2023-05-13 01:00:04,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +25: [2023-05-13 01:00:04,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +25: [2023-05-13 01:00:04,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +25: [2023-05-13 01:00:04,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +25: [2023-05-13 01:00:04,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +18: [2023-05-13 01:00:04,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +25: [2023-05-13 01:00:04,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +22: [2023-05-13 01:00:04,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +22: [2023-05-13 01:00:04,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +16: [2023-05-13 01:00:04,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +22: [2023-05-13 01:00:04,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +22: [2023-05-13 01:00:04,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +22: [2023-05-13 01:00:04,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +22: [2023-05-13 01:00:04,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +22: [2023-05-13 01:00:04,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +10: [2023-05-13 01:00:04,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +10: [2023-05-13 01:00:04,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +10: [2023-05-13 01:00:04,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +10: [2023-05-13 01:00:04,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +25: [2023-05-13 01:00:04,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +25: [2023-05-13 01:00:04,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +10: [2023-05-13 01:00:04,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +10: [2023-05-13 01:00:04,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +10: [2023-05-13 01:00:04,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +28: [2023-05-13 01:00:04,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +28: [2023-05-13 01:00:04,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +28: [2023-05-13 01:00:04,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +28: [2023-05-13 01:00:04,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +28: [2023-05-13 01:00:04,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +28: [2023-05-13 01:00:04,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +28: [2023-05-13 01:00:04,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +16: [2023-05-13 01:00:04,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +20: [2023-05-13 01:00:04,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +20: [2023-05-13 01:00:04,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +20: [2023-05-13 01:00:04,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +20: [2023-05-13 01:00:04,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +20: [2023-05-13 01:00:04,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +20: [2023-05-13 01:00:04,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +20: [2023-05-13 01:00:04,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +22: [2023-05-13 01:00:04,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +16: [2023-05-13 01:00:04,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +10: [2023-05-13 01:00:04,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +30: [2023-05-13 01:00:04,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +30: [2023-05-13 01:00:04,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +16: [2023-05-13 01:00:04,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +28: [2023-05-13 01:00:04,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +20: [2023-05-13 01:00:04,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +11: [2023-05-13 01:00:04,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +11: [2023-05-13 01:00:04,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +30: [2023-05-13 01:00:04,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +30: [2023-05-13 01:00:04,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +30: [2023-05-13 01:00:04,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +30: [2023-05-13 01:00:04,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +30: [2023-05-13 01:00:04,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +11: [2023-05-13 01:00:04,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +11: [2023-05-13 01:00:04,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +11: [2023-05-13 01:00:04,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +11: [2023-05-13 01:00:04,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +11: [2023-05-13 01:00:04,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +25: [2023-05-13 01:00:04,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +20: [2023-05-13 01:00:04,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +30: [2023-05-13 01:00:04,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +25: [2023-05-13 01:00:04,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +25: [2023-05-13 01:00:04,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +18: [2023-05-13 01:00:04,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +30: [2023-05-13 01:00:04,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +25: [2023-05-13 01:00:04,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +10: [2023-05-13 01:00:04,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +10: [2023-05-13 01:00:04,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +22: [2023-05-13 01:00:04,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +22: [2023-05-13 01:00:04,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +22: [2023-05-13 01:00:04,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +22: [2023-05-13 01:00:04,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +10: [2023-05-13 01:00:04,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +10: [2023-05-13 01:00:04,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +10: [2023-05-13 01:00:04,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +10: [2023-05-13 01:00:04,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +25: [2023-05-13 01:00:04,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +11: [2023-05-13 01:00:04,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +10: [2023-05-13 01:00:04,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +22: [2023-05-13 01:00:04,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +30: [2023-05-13 01:00:04,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +22: [2023-05-13 01:00:04,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +25: [2023-05-13 01:00:04,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:04,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +10: [2023-05-13 01:00:04,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +28: [2023-05-13 01:00:04,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +28: [2023-05-13 01:00:04,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +28: [2023-05-13 01:00:04,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +28: [2023-05-13 01:00:04,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +28: [2023-05-13 01:00:04,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:04,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +28: [2023-05-13 01:00:04,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +12: [2023-05-13 01:00:04,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +22: [2023-05-13 01:00:04,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +28: [2023-05-13 01:00:04,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:04,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +12: [2023-05-13 01:00:04,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +12: [2023-05-13 01:00:04,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +12: [2023-05-13 01:00:04,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +22: [2023-05-13 01:00:04,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +28: [2023-05-13 01:00:04,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:04,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +11: [2023-05-13 01:00:04,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +11: [2023-05-13 01:00:04,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +11: [2023-05-13 01:00:04,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +11: [2023-05-13 01:00:04,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +11: [2023-05-13 01:00:04,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:04,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +20: [2023-05-13 01:00:04,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +11: [2023-05-13 01:00:04,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +20: [2023-05-13 01:00:04,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +11: [2023-05-13 01:00:04,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +20: [2023-05-13 01:00:04,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +11: [2023-05-13 01:00:04,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +20: [2023-05-13 01:00:04,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +20: [2023-05-13 01:00:04,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +20: [2023-05-13 01:00:04,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +20: [2023-05-13 01:00:04,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +30: [2023-05-13 01:00:04,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +30: [2023-05-13 01:00:04,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +30: [2023-05-13 01:00:04,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:04,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +12: [2023-05-13 01:00:04,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +18: [2023-05-13 01:00:04,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +30: [2023-05-13 01:00:04,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +27: [2023-05-13 01:00:04,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +12: [2023-05-13 01:00:04,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +30: [2023-05-13 01:00:04,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +12: [2023-05-13 01:00:04,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +27: [2023-05-13 01:00:04,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +12: [2023-05-13 01:00:04,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +30: [2023-05-13 01:00:04,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +18: [2023-05-13 01:00:04,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +12: [2023-05-13 01:00:04,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +18: [2023-05-13 01:00:04,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +18: [2023-05-13 01:00:04,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +12: [2023-05-13 01:00:04,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +18: [2023-05-13 01:00:04,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +27: [2023-05-13 01:00:04,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +27: [2023-05-13 01:00:04,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:04,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +21: [2023-05-13 01:00:04,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:04,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +21: [2023-05-13 01:00:04,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +21: [2023-05-13 01:00:04,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +21: [2023-05-13 01:00:04,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +21: [2023-05-13 01:00:04,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +21: [2023-05-13 01:00:04,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +21: [2023-05-13 01:00:04,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:04,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:04,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:04,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:04,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +27: [2023-05-13 01:00:04,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +27: [2023-05-13 01:00:04,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +21: [2023-05-13 01:00:04,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:04,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:04,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +27: [2023-05-13 01:00:04,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +27: [2023-05-13 01:00:04,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +24: [2023-05-13 01:00:04,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +24: [2023-05-13 01:00:04,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +24: [2023-05-13 01:00:04,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +24: [2023-05-13 01:00:04,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +24: [2023-05-13 01:00:04,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +24: [2023-05-13 01:00:04,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +24: [2023-05-13 01:00:04,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +24: [2023-05-13 01:00:04,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +31: [2023-05-13 01:00:04,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +24: [2023-05-13 01:00:04,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +31: [2023-05-13 01:00:04,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +24: [2023-05-13 01:00:04,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +24: [2023-05-13 01:00:04,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +24: [2023-05-13 01:00:04,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +25: [2023-05-13 01:00:04,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +25: [2023-05-13 01:00:04,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +24: [2023-05-13 01:00:04,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +24: [2023-05-13 01:00:04,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +24: [2023-05-13 01:00:04,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +24: [2023-05-13 01:00:04,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +30: [2023-05-13 01:00:04,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +30: [2023-05-13 01:00:04,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +20: [2023-05-13 01:00:04,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +12: [2023-05-13 01:00:04,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +10: [2023-05-13 01:00:04,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +22: [2023-05-13 01:00:04,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +22: [2023-05-13 01:00:04,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +22: [2023-05-13 01:00:04,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +25: [2023-05-13 01:00:04,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +28: [2023-05-13 01:00:04,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +11: [2023-05-13 01:00:04,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +22: [2023-05-13 01:00:04,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +22: [2023-05-13 01:00:04,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +10: [2023-05-13 01:00:04,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +10: [2023-05-13 01:00:04,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +10: [2023-05-13 01:00:04,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +10: [2023-05-13 01:00:04,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +22: [2023-05-13 01:00:04,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +28: [2023-05-13 01:00:04,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +11: [2023-05-13 01:00:04,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +11: [2023-05-13 01:00:04,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +25: [2023-05-13 01:00:04,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +11: [2023-05-13 01:00:04,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +11: [2023-05-13 01:00:04,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +22: [2023-05-13 01:00:04,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +22: [2023-05-13 01:00:04,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +10: [2023-05-13 01:00:04,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +10: [2023-05-13 01:00:04,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +10: [2023-05-13 01:00:04,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +28: [2023-05-13 01:00:04,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +25: [2023-05-13 01:00:04,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +25: [2023-05-13 01:00:04,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +25: [2023-05-13 01:00:04,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +25: [2023-05-13 01:00:04,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +25: [2023-05-13 01:00:04,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +25: [2023-05-13 01:00:04,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +28: [2023-05-13 01:00:04,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +28: [2023-05-13 01:00:04,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +11: [2023-05-13 01:00:04,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +28: [2023-05-13 01:00:04,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +30: [2023-05-13 01:00:04,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +30: [2023-05-13 01:00:04,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +30: [2023-05-13 01:00:04,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +31: [2023-05-13 01:00:04,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +30: [2023-05-13 01:00:04,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +13: [2023-05-13 01:00:04,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +13: [2023-05-13 01:00:04,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +31: [2023-05-13 01:00:04,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +30: [2023-05-13 01:00:04,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +23: [2023-05-13 01:00:04,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +23: [2023-05-13 01:00:04,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +29: [2023-05-13 01:00:04,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +29: [2023-05-13 01:00:04,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +29: [2023-05-13 01:00:04,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +29: [2023-05-13 01:00:04,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +29: [2023-05-13 01:00:04,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +29: [2023-05-13 01:00:04,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +29: [2023-05-13 01:00:04,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +31: [2023-05-13 01:00:04,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +13: [2023-05-13 01:00:04,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +30: [2023-05-13 01:00:04,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +30: [2023-05-13 01:00:04,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +30: [2023-05-13 01:00:04,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +23: [2023-05-13 01:00:04,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +13: [2023-05-13 01:00:04,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +13: [2023-05-13 01:00:04,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +13: [2023-05-13 01:00:04,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +13: [2023-05-13 01:00:04,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +28: [2023-05-13 01:00:04,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +12: [2023-05-13 01:00:04,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +20: [2023-05-13 01:00:04,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +23: [2023-05-13 01:00:04,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +23: [2023-05-13 01:00:04,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +23: [2023-05-13 01:00:04,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +23: [2023-05-13 01:00:04,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +29: [2023-05-13 01:00:04,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +12: [2023-05-13 01:00:04,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +12: [2023-05-13 01:00:04,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +22: [2023-05-13 01:00:04,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +13: [2023-05-13 01:00:04,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +23: [2023-05-13 01:00:04,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +13: [2023-05-13 01:00:04,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +23: [2023-05-13 01:00:04,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +13: [2023-05-13 01:00:04,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +23: [2023-05-13 01:00:04,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +14: [2023-05-13 01:00:04,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +14: [2023-05-13 01:00:04,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +14: [2023-05-13 01:00:04,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +14: [2023-05-13 01:00:04,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +14: [2023-05-13 01:00:04,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +14: [2023-05-13 01:00:04,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +14: [2023-05-13 01:00:04,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +11: [2023-05-13 01:00:04,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +20: [2023-05-13 01:00:04,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +20: [2023-05-13 01:00:04,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +20: [2023-05-13 01:00:04,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +14: [2023-05-13 01:00:04,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +13: [2023-05-13 01:00:04,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +20: [2023-05-13 01:00:04,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +20: [2023-05-13 01:00:04,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +20: [2023-05-13 01:00:04,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +20: [2023-05-13 01:00:04,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +11: [2023-05-13 01:00:04,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +25: [2023-05-13 01:00:04,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +10: [2023-05-13 01:00:04,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +29: [2023-05-13 01:00:04,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +29: [2023-05-13 01:00:04,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:04,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +28: [2023-05-13 01:00:04,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +29: [2023-05-13 01:00:04,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +29: [2023-05-13 01:00:04,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +29: [2023-05-13 01:00:04,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +29: [2023-05-13 01:00:04,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +29: [2023-05-13 01:00:04,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +29: [2023-05-13 01:00:04,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +23: [2023-05-13 01:00:04,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +23: [2023-05-13 01:00:04,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:04,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +21: [2023-05-13 01:00:04,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +12: [2023-05-13 01:00:04,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +12: [2023-05-13 01:00:04,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +12: [2023-05-13 01:00:04,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +12: [2023-05-13 01:00:04,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +12: [2023-05-13 01:00:04,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +14: [2023-05-13 01:00:04,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +14: [2023-05-13 01:00:04,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +14: [2023-05-13 01:00:04,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +23: [2023-05-13 01:00:04,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +14: [2023-05-13 01:00:04,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +23: [2023-05-13 01:00:04,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +23: [2023-05-13 01:00:04,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +22: [2023-05-13 01:00:04,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +22: [2023-05-13 01:00:04,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +14: [2023-05-13 01:00:04,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +13: [2023-05-13 01:00:04,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +13: [2023-05-13 01:00:04,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +14: [2023-05-13 01:00:04,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +14: [2023-05-13 01:00:04,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +23: [2023-05-13 01:00:04,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +14: [2023-05-13 01:00:04,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +13: [2023-05-13 01:00:04,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +11: [2023-05-13 01:00:04,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +21: [2023-05-13 01:00:04,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +21: [2023-05-13 01:00:04,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +13: [2023-05-13 01:00:04,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +28: [2023-05-13 01:00:04,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +13: [2023-05-13 01:00:04,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +21: [2023-05-13 01:00:04,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +21: [2023-05-13 01:00:04,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +21: [2023-05-13 01:00:04,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +11: [2023-05-13 01:00:04,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +11: [2023-05-13 01:00:04,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +10: [2023-05-13 01:00:04,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +10: [2023-05-13 01:00:04,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +22: [2023-05-13 01:00:04,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +28: [2023-05-13 01:00:04,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +10: [2023-05-13 01:00:04,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +10: [2023-05-13 01:00:04,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +24: [2023-05-13 01:00:04,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +10: [2023-05-13 01:00:04,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +22: [2023-05-13 01:00:04,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +24: [2023-05-13 01:00:04,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +10: [2023-05-13 01:00:04,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +10: [2023-05-13 01:00:04,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +11: [2023-05-13 01:00:04,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +22: [2023-05-13 01:00:04,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +22: [2023-05-13 01:00:04,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +11: [2023-05-13 01:00:04,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +22: [2023-05-13 01:00:04,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +28: [2023-05-13 01:00:04,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +25: [2023-05-13 01:00:04,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +28: [2023-05-13 01:00:04,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +28: [2023-05-13 01:00:04,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +25: [2023-05-13 01:00:04,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +15: [2023-05-13 01:00:04,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +15: [2023-05-13 01:00:04,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +25: [2023-05-13 01:00:04,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +11: [2023-05-13 01:00:04,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +25: [2023-05-13 01:00:04,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +25: [2023-05-13 01:00:04,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +15: [2023-05-13 01:00:04,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +15: [2023-05-13 01:00:04,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +15: [2023-05-13 01:00:04,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +15: [2023-05-13 01:00:04,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +28: [2023-05-13 01:00:04,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +28: [2023-05-13 01:00:04,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +15: [2023-05-13 01:00:04,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +15: [2023-05-13 01:00:04,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +30: [2023-05-13 01:00:04,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +28: [2023-05-13 01:00:04,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +12: [2023-05-13 01:00:04,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +30: [2023-05-13 01:00:04,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +12: [2023-05-13 01:00:04,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +30: [2023-05-13 01:00:04,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +21: [2023-05-13 01:00:04,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +24: [2023-05-13 01:00:04,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +24: [2023-05-13 01:00:04,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +24: [2023-05-13 01:00:04,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +24: [2023-05-13 01:00:04,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +24: [2023-05-13 01:00:04,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +24: [2023-05-13 01:00:04,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +11: [2023-05-13 01:00:04,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +11: [2023-05-13 01:00:04,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +15: [2023-05-13 01:00:04,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +15: [2023-05-13 01:00:04,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +15: [2023-05-13 01:00:04,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +30: [2023-05-13 01:00:04,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +30: [2023-05-13 01:00:04,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +15: [2023-05-13 01:00:04,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +21: [2023-05-13 01:00:04,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +21: [2023-05-13 01:00:04,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +21: [2023-05-13 01:00:04,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +21: [2023-05-13 01:00:04,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +20: [2023-05-13 01:00:04,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +30: [2023-05-13 01:00:04,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +12: [2023-05-13 01:00:04,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +24: [2023-05-13 01:00:04,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +20: [2023-05-13 01:00:04,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +12: [2023-05-13 01:00:04,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +12: [2023-05-13 01:00:04,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +21: [2023-05-13 01:00:04,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +20: [2023-05-13 01:00:04,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +21: [2023-05-13 01:00:04,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +20: [2023-05-13 01:00:04,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +20: [2023-05-13 01:00:04,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +24: [2023-05-13 01:00:04,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +20: [2023-05-13 01:00:04,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +21: [2023-05-13 01:00:04,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +20: [2023-05-13 01:00:04,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +12: [2023-05-13 01:00:04,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +12: [2023-05-13 01:00:04,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +23: [2023-05-13 01:00:04,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +23: [2023-05-13 01:00:04,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +13: [2023-05-13 01:00:04,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +13: [2023-05-13 01:00:04,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +13: [2023-05-13 01:00:04,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +29: [2023-05-13 01:00:04,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +29: [2023-05-13 01:00:04,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +29: [2023-05-13 01:00:04,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +29: [2023-05-13 01:00:04,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +14: [2023-05-13 01:00:04,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +14: [2023-05-13 01:00:04,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +14: [2023-05-13 01:00:04,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +29: [2023-05-13 01:00:04,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +29: [2023-05-13 01:00:04,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +29: [2023-05-13 01:00:04,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +13: [2023-05-13 01:00:04,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +13: [2023-05-13 01:00:04,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +14: [2023-05-13 01:00:04,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +14: [2023-05-13 01:00:04,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +14: [2023-05-13 01:00:04,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +13: [2023-05-13 01:00:04,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +13: [2023-05-13 01:00:04,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +13: [2023-05-13 01:00:04,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +14: [2023-05-13 01:00:04,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +14: [2023-05-13 01:00:04,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +23: [2023-05-13 01:00:04,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +24: [2023-05-13 01:00:04,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +24: [2023-05-13 01:00:04,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +23: [2023-05-13 01:00:04,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +23: [2023-05-13 01:00:04,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +23: [2023-05-13 01:00:04,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +23: [2023-05-13 01:00:04,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +23: [2023-05-13 01:00:04,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +24: [2023-05-13 01:00:04,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +17: [2023-05-13 01:00:04,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +29: [2023-05-13 01:00:04,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +24: [2023-05-13 01:00:04,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +24: [2023-05-13 01:00:04,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +23: [2023-05-13 01:00:04,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +24: [2023-05-13 01:00:04,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +17: [2023-05-13 01:00:04,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +17: [2023-05-13 01:00:04,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +17: [2023-05-13 01:00:04,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +23: [2023-05-13 01:00:04,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +17: [2023-05-13 01:00:04,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +13: [2023-05-13 01:00:04,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +13: [2023-05-13 01:00:04,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +13: [2023-05-13 01:00:04,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +15: [2023-05-13 01:00:04,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +17: [2023-05-13 01:00:04,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +29: [2023-05-13 01:00:04,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +17: [2023-05-13 01:00:04,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +17: [2023-05-13 01:00:04,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... +17: [2023-05-13 01:00:04,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +17: [2023-05-13 01:00:04,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +14: [2023-05-13 01:00:04,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +14: [2023-05-13 01:00:04,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +14: [2023-05-13 01:00:04,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +14: [2023-05-13 01:00:04,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +14: [2023-05-13 01:00:04,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +29: [2023-05-13 01:00:04,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +29: [2023-05-13 01:00:04,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +29: [2023-05-13 01:00:04,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +23: [2023-05-13 01:00:04,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +14: [2023-05-13 01:00:04,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +14: [2023-05-13 01:00:04,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +14: [2023-05-13 01:00:04,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +29: [2023-05-13 01:00:04,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +29: [2023-05-13 01:00:04,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +15: [2023-05-13 01:00:04,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +29: [2023-05-13 01:00:04,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +13: [2023-05-13 01:00:04,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +13: [2023-05-13 01:00:04,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +15: [2023-05-13 01:00:04,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +15: [2023-05-13 01:00:04,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +15: [2023-05-13 01:00:04,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +29: [2023-05-13 01:00:04,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +13: [2023-05-13 01:00:04,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +13: [2023-05-13 01:00:04,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +13: [2023-05-13 01:00:04,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +15: [2023-05-13 01:00:04,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +23: [2023-05-13 01:00:04,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +23: [2023-05-13 01:00:04,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +23: [2023-05-13 01:00:04,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +23: [2023-05-13 01:00:04,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +23: [2023-05-13 01:00:04,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +17: [2023-05-13 01:00:04,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +17: [2023-05-13 01:00:04,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +17: [2023-05-13 01:00:04,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +17: [2023-05-13 01:00:04,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +17: [2023-05-13 01:00:04,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +17: [2023-05-13 01:00:04,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_03-model_00-model_states.pt. +17: [2023-05-13 01:00:04,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +16: [2023-05-13 01:00:04,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +16: [2023-05-13 01:00:04,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +16: [2023-05-13 01:00:04,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +16: [2023-05-13 01:00:04,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +16: [2023-05-13 01:00:04,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +16: [2023-05-13 01:00:04,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +16: [2023-05-13 01:00:04,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +16: [2023-05-13 01:00:04,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +16: [2023-05-13 01:00:04,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +16: [2023-05-13 01:00:04,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +16: [2023-05-13 01:00:04,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +16: [2023-05-13 01:00:04,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +16: [2023-05-13 01:00:04,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +16: [2023-05-13 01:00:04,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +16: [2023-05-13 01:00:04,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +16: [2023-05-13 01:00:04,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +16: [2023-05-13 01:00:04,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +31: [2023-05-13 01:00:04,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +31: [2023-05-13 01:00:04,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +31: [2023-05-13 01:00:04,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +31: [2023-05-13 01:00:04,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +31: [2023-05-13 01:00:04,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +31: [2023-05-13 01:00:04,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +31: [2023-05-13 01:00:04,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +31: [2023-05-13 01:00:04,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +31: [2023-05-13 01:00:04,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +31: [2023-05-13 01:00:04,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +31: [2023-05-13 01:00:04,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +31: [2023-05-13 01:00:04,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +31: [2023-05-13 01:00:04,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +31: [2023-05-13 01:00:04,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +31: [2023-05-13 01:00:04,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +31: [2023-05-13 01:00:04,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +16: [2023-05-13 01:00:04,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +16: [2023-05-13 01:00:04,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +16: [2023-05-13 01:00:04,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +16: [2023-05-13 01:00:04,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +16: [2023-05-13 01:00:04,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +16: [2023-05-13 01:00:04,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +16: [2023-05-13 01:00:04,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +16: [2023-05-13 01:00:04,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +26: [2023-05-13 01:00:04,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +26: [2023-05-13 01:00:04,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +26: [2023-05-13 01:00:04,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +26: [2023-05-13 01:00:04,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +26: [2023-05-13 01:00:04,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +26: [2023-05-13 01:00:04,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +26: [2023-05-13 01:00:04,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +26: [2023-05-13 01:00:04,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +26: [2023-05-13 01:00:04,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +26: [2023-05-13 01:00:04,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +26: [2023-05-13 01:00:04,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +26: [2023-05-13 01:00:04,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +26: [2023-05-13 01:00:04,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +26: [2023-05-13 01:00:04,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +26: [2023-05-13 01:00:04,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +26: [2023-05-13 01:00:04,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +31: [2023-05-13 01:00:04,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +16: [2023-05-13 01:00:04,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:04,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +31: [2023-05-13 01:00:04,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +31: [2023-05-13 01:00:04,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +31: [2023-05-13 01:00:04,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +31: [2023-05-13 01:00:04,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +31: [2023-05-13 01:00:04,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +31: [2023-05-13 01:00:04,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +16: [2023-05-13 01:00:04,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +16: [2023-05-13 01:00:04,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +16: [2023-05-13 01:00:04,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +16: [2023-05-13 01:00:04,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +16: [2023-05-13 01:00:04,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +16: [2023-05-13 01:00:04,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:04,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +18: [2023-05-13 01:00:04,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +18: [2023-05-13 01:00:04,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +18: [2023-05-13 01:00:04,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +18: [2023-05-13 01:00:04,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +18: [2023-05-13 01:00:04,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +18: [2023-05-13 01:00:04,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +18: [2023-05-13 01:00:04,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +18: [2023-05-13 01:00:04,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +31: [2023-05-13 01:00:04,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:04,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:04,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:04,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:04,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:04,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:04,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +18: [2023-05-13 01:00:04,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +18: [2023-05-13 01:00:04,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +18: [2023-05-13 01:00:04,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +18: [2023-05-13 01:00:04,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +18: [2023-05-13 01:00:04,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +18: [2023-05-13 01:00:04,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +18: [2023-05-13 01:00:04,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +18: [2023-05-13 01:00:04,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +26: [2023-05-13 01:00:04,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +26: [2023-05-13 01:00:04,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +26: [2023-05-13 01:00:04,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +26: [2023-05-13 01:00:04,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +26: [2023-05-13 01:00:04,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +26: [2023-05-13 01:00:04,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +26: [2023-05-13 01:00:04,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +26: [2023-05-13 01:00:04,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +26: [2023-05-13 01:00:04,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +26: [2023-05-13 01:00:04,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +10: [2023-05-13 01:00:04,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +10: [2023-05-13 01:00:04,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +10: [2023-05-13 01:00:04,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +10: [2023-05-13 01:00:04,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +10: [2023-05-13 01:00:04,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +10: [2023-05-13 01:00:04,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +10: [2023-05-13 01:00:04,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +10: [2023-05-13 01:00:04,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +26: [2023-05-13 01:00:04,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +10: [2023-05-13 01:00:04,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +10: [2023-05-13 01:00:04,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +10: [2023-05-13 01:00:04,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +10: [2023-05-13 01:00:04,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +10: [2023-05-13 01:00:04,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +10: [2023-05-13 01:00:04,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +10: [2023-05-13 01:00:04,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +10: [2023-05-13 01:00:04,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +12: [2023-05-13 01:00:04,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +12: [2023-05-13 01:00:04,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +12: [2023-05-13 01:00:04,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +12: [2023-05-13 01:00:04,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +12: [2023-05-13 01:00:04,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +12: [2023-05-13 01:00:04,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +12: [2023-05-13 01:00:04,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +12: [2023-05-13 01:00:04,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +27: [2023-05-13 01:00:04,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +27: [2023-05-13 01:00:04,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +27: [2023-05-13 01:00:04,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +27: [2023-05-13 01:00:04,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +27: [2023-05-13 01:00:04,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +27: [2023-05-13 01:00:04,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +27: [2023-05-13 01:00:04,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +12: [2023-05-13 01:00:04,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +27: [2023-05-13 01:00:04,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +18: [2023-05-13 01:00:04,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +18: [2023-05-13 01:00:04,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +18: [2023-05-13 01:00:04,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +12: [2023-05-13 01:00:04,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +12: [2023-05-13 01:00:04,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +27: [2023-05-13 01:00:04,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +27: [2023-05-13 01:00:04,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +12: [2023-05-13 01:00:04,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +27: [2023-05-13 01:00:04,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +27: [2023-05-13 01:00:04,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +12: [2023-05-13 01:00:04,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +27: [2023-05-13 01:00:04,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +12: [2023-05-13 01:00:04,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +27: [2023-05-13 01:00:04,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +12: [2023-05-13 01:00:04,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +27: [2023-05-13 01:00:04,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +12: [2023-05-13 01:00:04,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +27: [2023-05-13 01:00:04,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +18: [2023-05-13 01:00:04,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +26: [2023-05-13 01:00:04,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +26: [2023-05-13 01:00:04,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +26: [2023-05-13 01:00:04,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +19: [2023-05-13 01:00:04,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +19: [2023-05-13 01:00:04,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +19: [2023-05-13 01:00:04,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +19: [2023-05-13 01:00:04,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +19: [2023-05-13 01:00:04,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +19: [2023-05-13 01:00:04,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +19: [2023-05-13 01:00:04,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +19: [2023-05-13 01:00:04,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +26: [2023-05-13 01:00:04,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +18: [2023-05-13 01:00:04,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +18: [2023-05-13 01:00:04,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +18: [2023-05-13 01:00:04,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +18: [2023-05-13 01:00:04,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +26: [2023-05-13 01:00:04,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +19: [2023-05-13 01:00:04,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +19: [2023-05-13 01:00:04,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +19: [2023-05-13 01:00:04,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +19: [2023-05-13 01:00:04,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +18: [2023-05-13 01:00:04,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +19: [2023-05-13 01:00:04,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +19: [2023-05-13 01:00:04,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +19: [2023-05-13 01:00:04,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +19: [2023-05-13 01:00:04,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +18: [2023-05-13 01:00:04,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +18: [2023-05-13 01:00:04,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:04,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +21: [2023-05-13 01:00:04,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +21: [2023-05-13 01:00:04,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +21: [2023-05-13 01:00:04,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +21: [2023-05-13 01:00:04,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +21: [2023-05-13 01:00:04,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +21: [2023-05-13 01:00:04,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +21: [2023-05-13 01:00:04,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +21: [2023-05-13 01:00:04,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +21: [2023-05-13 01:00:04,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +18: [2023-05-13 01:00:04,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:04,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +18: [2023-05-13 01:00:04,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:04,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +21: [2023-05-13 01:00:04,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +21: [2023-05-13 01:00:04,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:04,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +21: [2023-05-13 01:00:04,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +18: [2023-05-13 01:00:04,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +18: [2023-05-13 01:00:04,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +18: [2023-05-13 01:00:04,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +12: [2023-05-13 01:00:04,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +10: [2023-05-13 01:00:04,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +10: [2023-05-13 01:00:04,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +10: [2023-05-13 01:00:04,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +10: [2023-05-13 01:00:04,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +10: [2023-05-13 01:00:04,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +10: [2023-05-13 01:00:04,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +10: [2023-05-13 01:00:04,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +10: [2023-05-13 01:00:04,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +27: [2023-05-13 01:00:04,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +27: [2023-05-13 01:00:04,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +27: [2023-05-13 01:00:04,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +27: [2023-05-13 01:00:04,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +19: [2023-05-13 01:00:04,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +12: [2023-05-13 01:00:04,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +27: [2023-05-13 01:00:04,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +27: [2023-05-13 01:00:04,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +27: [2023-05-13 01:00:04,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +27: [2023-05-13 01:00:04,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +12: [2023-05-13 01:00:04,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +12: [2023-05-13 01:00:04,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +10: [2023-05-13 01:00:04,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 8: [2023-05-13 01:00:04,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +10: [2023-05-13 01:00:04,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +10: [2023-05-13 01:00:04,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +10: [2023-05-13 01:00:04,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 8: [2023-05-13 01:00:04,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +10: [2023-05-13 01:00:04,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +10: [2023-05-13 01:00:04,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +10: [2023-05-13 01:00:04,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +10: [2023-05-13 01:00:04,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +19: [2023-05-13 01:00:04,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +12: [2023-05-13 01:00:04,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +12: [2023-05-13 01:00:04,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +12: [2023-05-13 01:00:04,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +12: [2023-05-13 01:00:04,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +12: [2023-05-13 01:00:04,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +21: [2023-05-13 01:00:04,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +21: [2023-05-13 01:00:04,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +21: [2023-05-13 01:00:04,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +21: [2023-05-13 01:00:04,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +21: [2023-05-13 01:00:04,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +21: [2023-05-13 01:00:04,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +21: [2023-05-13 01:00:04,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +19: [2023-05-13 01:00:04,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +19: [2023-05-13 01:00:04,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +19: [2023-05-13 01:00:04,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +12: [2023-05-13 01:00:04,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +27: [2023-05-13 01:00:04,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +27: [2023-05-13 01:00:04,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +12: [2023-05-13 01:00:04,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +27: [2023-05-13 01:00:04,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +27: [2023-05-13 01:00:04,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +27: [2023-05-13 01:00:04,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +27: [2023-05-13 01:00:04,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +21: [2023-05-13 01:00:04,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 5: [2023-05-13 01:00:04,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +19: [2023-05-13 01:00:04,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +19: [2023-05-13 01:00:04,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +19: [2023-05-13 01:00:04,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +19: [2023-05-13 01:00:04,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 5: [2023-05-13 01:00:04,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +27: [2023-05-13 01:00:04,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +27: [2023-05-13 01:00:04,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +11: [2023-05-13 01:00:04,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +11: [2023-05-13 01:00:04,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +11: [2023-05-13 01:00:04,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +11: [2023-05-13 01:00:04,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +11: [2023-05-13 01:00:04,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +11: [2023-05-13 01:00:04,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +11: [2023-05-13 01:00:04,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +11: [2023-05-13 01:00:04,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +11: [2023-05-13 01:00:04,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +11: [2023-05-13 01:00:04,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +11: [2023-05-13 01:00:04,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +11: [2023-05-13 01:00:04,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +21: [2023-05-13 01:00:04,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +11: [2023-05-13 01:00:04,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +11: [2023-05-13 01:00:04,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +11: [2023-05-13 01:00:04,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +11: [2023-05-13 01:00:04,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +12: [2023-05-13 01:00:04,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:04,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +12: [2023-05-13 01:00:04,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +12: [2023-05-13 01:00:04,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:04,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:04,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +12: [2023-05-13 01:00:04,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +12: [2023-05-13 01:00:04,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +19: [2023-05-13 01:00:04,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +21: [2023-05-13 01:00:04,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:04,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:04,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +21: [2023-05-13 01:00:04,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +19: [2023-05-13 01:00:04,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:04,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +15: [2023-05-13 01:00:04,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +19: [2023-05-13 01:00:04,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +19: [2023-05-13 01:00:04,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +19: [2023-05-13 01:00:04,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:04,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +15: [2023-05-13 01:00:04,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +15: [2023-05-13 01:00:04,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +15: [2023-05-13 01:00:04,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +15: [2023-05-13 01:00:04,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +24: [2023-05-13 01:00:04,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +24: [2023-05-13 01:00:04,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +24: [2023-05-13 01:00:04,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +24: [2023-05-13 01:00:04,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +24: [2023-05-13 01:00:04,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +24: [2023-05-13 01:00:04,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +24: [2023-05-13 01:00:04,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +24: [2023-05-13 01:00:04,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +19: [2023-05-13 01:00:04,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +29: [2023-05-13 01:00:04,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +29: [2023-05-13 01:00:04,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +29: [2023-05-13 01:00:04,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +29: [2023-05-13 01:00:04,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +29: [2023-05-13 01:00:04,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +29: [2023-05-13 01:00:04,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +29: [2023-05-13 01:00:04,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +29: [2023-05-13 01:00:04,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +19: [2023-05-13 01:00:04,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +24: [2023-05-13 01:00:04,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +24: [2023-05-13 01:00:04,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +24: [2023-05-13 01:00:04,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +24: [2023-05-13 01:00:04,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +24: [2023-05-13 01:00:04,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +29: [2023-05-13 01:00:04,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +29: [2023-05-13 01:00:04,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +24: [2023-05-13 01:00:04,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +29: [2023-05-13 01:00:04,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +24: [2023-05-13 01:00:04,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +29: [2023-05-13 01:00:04,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +29: [2023-05-13 01:00:04,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +29: [2023-05-13 01:00:04,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +24: [2023-05-13 01:00:04,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +29: [2023-05-13 01:00:04,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +29: [2023-05-13 01:00:04,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +22: [2023-05-13 01:00:04,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +22: [2023-05-13 01:00:04,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +22: [2023-05-13 01:00:04,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +22: [2023-05-13 01:00:04,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +22: [2023-05-13 01:00:04,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +22: [2023-05-13 01:00:04,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +22: [2023-05-13 01:00:04,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +22: [2023-05-13 01:00:04,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +22: [2023-05-13 01:00:04,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +22: [2023-05-13 01:00:04,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +22: [2023-05-13 01:00:04,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +22: [2023-05-13 01:00:04,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +22: [2023-05-13 01:00:04,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +22: [2023-05-13 01:00:04,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +17: [2023-05-13 01:00:04,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +22: [2023-05-13 01:00:04,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +22: [2023-05-13 01:00:04,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +25: [2023-05-13 01:00:04,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +25: [2023-05-13 01:00:04,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +17: [2023-05-13 01:00:04,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +17: [2023-05-13 01:00:04,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +17: [2023-05-13 01:00:04,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +17: [2023-05-13 01:00:04,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +17: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +30: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +30: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +30: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +30: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +14: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +14: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +14: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +14: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +14: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +14: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +14: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +23: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +23: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +30: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +30: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +30: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +14: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +28: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +28: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +28: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +28: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +28: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +28: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +28: [2023-05-13 01:00:04,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +28: [2023-05-13 01:00:04,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +25: [2023-05-13 01:00:04,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +30: [2023-05-13 01:00:04,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +17: [2023-05-13 01:00:04,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +25: [2023-05-13 01:00:04,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +25: [2023-05-13 01:00:04,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +25: [2023-05-13 01:00:04,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +25: [2023-05-13 01:00:04,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +25: [2023-05-13 01:00:04,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +25: [2023-05-13 01:00:04,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +25: [2023-05-13 01:00:04,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +23: [2023-05-13 01:00:04,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +30: [2023-05-13 01:00:04,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +23: [2023-05-13 01:00:04,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +23: [2023-05-13 01:00:04,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +23: [2023-05-13 01:00:04,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +23: [2023-05-13 01:00:04,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +23: [2023-05-13 01:00:04,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +14: [2023-05-13 01:00:04,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +14: [2023-05-13 01:00:04,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +23: [2023-05-13 01:00:04,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +14: [2023-05-13 01:00:04,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +30: [2023-05-13 01:00:04,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +14: [2023-05-13 01:00:04,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +23: [2023-05-13 01:00:04,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +28: [2023-05-13 01:00:04,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +28: [2023-05-13 01:00:04,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +14: [2023-05-13 01:00:04,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +28: [2023-05-13 01:00:04,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +14: [2023-05-13 01:00:04,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +28: [2023-05-13 01:00:04,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +14: [2023-05-13 01:00:04,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +28: [2023-05-13 01:00:04,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +28: [2023-05-13 01:00:04,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +28: [2023-05-13 01:00:04,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +14: [2023-05-13 01:00:04,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +28: [2023-05-13 01:00:04,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +25: [2023-05-13 01:00:04,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +17: [2023-05-13 01:00:04,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +25: [2023-05-13 01:00:04,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +23: [2023-05-13 01:00:04,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +11: [2023-05-13 01:00:04,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +11: [2023-05-13 01:00:04,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +25: [2023-05-13 01:00:04,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +25: [2023-05-13 01:00:04,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +25: [2023-05-13 01:00:04,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +30: [2023-05-13 01:00:04,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +30: [2023-05-13 01:00:04,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +25: [2023-05-13 01:00:04,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +23: [2023-05-13 01:00:04,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +30: [2023-05-13 01:00:04,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +23: [2023-05-13 01:00:04,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +30: [2023-05-13 01:00:04,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +30: [2023-05-13 01:00:04,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +23: [2023-05-13 01:00:04,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +30: [2023-05-13 01:00:04,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +23: [2023-05-13 01:00:04,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +23: [2023-05-13 01:00:04,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +11: [2023-05-13 01:00:04,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +11: [2023-05-13 01:00:04,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +11: [2023-05-13 01:00:04,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +11: [2023-05-13 01:00:04,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +11: [2023-05-13 01:00:04,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +11: [2023-05-13 01:00:04,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +11: [2023-05-13 01:00:04,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +11: [2023-05-13 01:00:04,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +15: [2023-05-13 01:00:04,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +15: [2023-05-13 01:00:04,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +24: [2023-05-13 01:00:04,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +11: [2023-05-13 01:00:04,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +24: [2023-05-13 01:00:04,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 6: [2023-05-13 01:00:04,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 6: [2023-05-13 01:00:04,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +22: [2023-05-13 01:00:04,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +22: [2023-05-13 01:00:04,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +22: [2023-05-13 01:00:04,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +29: [2023-05-13 01:00:04,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +29: [2023-05-13 01:00:04,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +29: [2023-05-13 01:00:04,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +29: [2023-05-13 01:00:04,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +25: [2023-05-13 01:00:04,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +25: [2023-05-13 01:00:04,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +17: [2023-05-13 01:00:04,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +17: [2023-05-13 01:00:04,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +30: [2023-05-13 01:00:04,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +30: [2023-05-13 01:00:04,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +29: [2023-05-13 01:00:04,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +29: [2023-05-13 01:00:04,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +29: [2023-05-13 01:00:04,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +11: [2023-05-13 01:00:04,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +23: [2023-05-13 01:00:04,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +29: [2023-05-13 01:00:04,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +13: [2023-05-13 01:00:04,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +13: [2023-05-13 01:00:04,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +24: [2023-05-13 01:00:04,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +24: [2023-05-13 01:00:04,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +22: [2023-05-13 01:00:04,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +13: [2023-05-13 01:00:04,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +13: [2023-05-13 01:00:04,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +13: [2023-05-13 01:00:04,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +13: [2023-05-13 01:00:04,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +13: [2023-05-13 01:00:04,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +15: [2023-05-13 01:00:04,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +13: [2023-05-13 01:00:04,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +20: [2023-05-13 01:00:04,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +20: [2023-05-13 01:00:04,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +20: [2023-05-13 01:00:04,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +20: [2023-05-13 01:00:04,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +20: [2023-05-13 01:00:04,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +20: [2023-05-13 01:00:04,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +20: [2023-05-13 01:00:04,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +23: [2023-05-13 01:00:04,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +20: [2023-05-13 01:00:04,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +13: [2023-05-13 01:00:04,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +13: [2023-05-13 01:00:04,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +13: [2023-05-13 01:00:04,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +15: [2023-05-13 01:00:04,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:04,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +11: [2023-05-13 01:00:04,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +24: [2023-05-13 01:00:04,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:04,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +15: [2023-05-13 01:00:04,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +15: [2023-05-13 01:00:04,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +15: [2023-05-13 01:00:04,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +11: [2023-05-13 01:00:04,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +20: [2023-05-13 01:00:04,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +14: [2023-05-13 01:00:04,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +24: [2023-05-13 01:00:04,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +11: [2023-05-13 01:00:04,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +11: [2023-05-13 01:00:04,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +13: [2023-05-13 01:00:04,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +13: [2023-05-13 01:00:04,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +13: [2023-05-13 01:00:04,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +14: [2023-05-13 01:00:04,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +14: [2023-05-13 01:00:04,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +14: [2023-05-13 01:00:04,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +13: [2023-05-13 01:00:04,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +24: [2023-05-13 01:00:04,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +24: [2023-05-13 01:00:04,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +24: [2023-05-13 01:00:04,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +24: [2023-05-13 01:00:04,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +13: [2023-05-13 01:00:04,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +22: [2023-05-13 01:00:04,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +22: [2023-05-13 01:00:04,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +22: [2023-05-13 01:00:04,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +22: [2023-05-13 01:00:04,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +14: [2023-05-13 01:00:04,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +14: [2023-05-13 01:00:04,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +14: [2023-05-13 01:00:04,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +20: [2023-05-13 01:00:04,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +20: [2023-05-13 01:00:04,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +20: [2023-05-13 01:00:04,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +28: [2023-05-13 01:00:04,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +28: [2023-05-13 01:00:04,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +20: [2023-05-13 01:00:04,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +28: [2023-05-13 01:00:04,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +28: [2023-05-13 01:00:04,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +20: [2023-05-13 01:00:04,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 2: [2023-05-13 01:00:04,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +28: [2023-05-13 01:00:04,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +20: [2023-05-13 01:00:04,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +22: [2023-05-13 01:00:04,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +28: [2023-05-13 01:00:04,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +28: [2023-05-13 01:00:04,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +28: [2023-05-13 01:00:04,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +20: [2023-05-13 01:00:04,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +22: [2023-05-13 01:00:04,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +25: [2023-05-13 01:00:04,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +22: [2023-05-13 01:00:04,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +25: [2023-05-13 01:00:04,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt... +17: [2023-05-13 01:00:04,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +17: [2023-05-13 01:00:04,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +25: [2023-05-13 01:00:04,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +30: [2023-05-13 01:00:04,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +30: [2023-05-13 01:00:04,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +23: [2023-05-13 01:00:04,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +23: [2023-05-13 01:00:04,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +30: [2023-05-13 01:00:04,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +30: [2023-05-13 01:00:04,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +30: [2023-05-13 01:00:04,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +22: [2023-05-13 01:00:04,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +24: [2023-05-13 01:00:04,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +30: [2023-05-13 01:00:04,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +30: [2023-05-13 01:00:04,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +30: [2023-05-13 01:00:04,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 4: [2023-05-13 01:00:04,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +24: [2023-05-13 01:00:04,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +29: [2023-05-13 01:00:04,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 4: [2023-05-13 01:00:04,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +23: [2023-05-13 01:00:04,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +29: [2023-05-13 01:00:04,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +29: [2023-05-13 01:00:04,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +29: [2023-05-13 01:00:04,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +29: [2023-05-13 01:00:04,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +17: [2023-05-13 01:00:04,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +17: [2023-05-13 01:00:04,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +17: [2023-05-13 01:00:04,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +17: [2023-05-13 01:00:04,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +17: [2023-05-13 01:00:04,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +14: [2023-05-13 01:00:04,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 9: [2023-05-13 01:00:04,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 9: [2023-05-13 01:00:04,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:04,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +25: [2023-05-13 01:00:04,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +25: [2023-05-13 01:00:04,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +25: [2023-05-13 01:00:04,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +25: [2023-05-13 01:00:04,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +25: [2023-05-13 01:00:04,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +15: [2023-05-13 01:00:04,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +14: [2023-05-13 01:00:04,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +29: [2023-05-13 01:00:04,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +29: [2023-05-13 01:00:04,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +29: [2023-05-13 01:00:04,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +25: [2023-05-13 01:00:04,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +22: [2023-05-13 01:00:04,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +22: [2023-05-13 01:00:04,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +23: [2023-05-13 01:00:04,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +23: [2023-05-13 01:00:04,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +23: [2023-05-13 01:00:04,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +23: [2023-05-13 01:00:04,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +23: [2023-05-13 01:00:04,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 0: [2023-05-13 01:00:04,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +24: [2023-05-13 01:00:04,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +14: [2023-05-13 01:00:04,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +14: [2023-05-13 01:00:04,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +14: [2023-05-13 01:00:04,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:04,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +14: [2023-05-13 01:00:04,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +22: [2023-05-13 01:00:04,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +14: [2023-05-13 01:00:04,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:04,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +24: [2023-05-13 01:00:04,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +14: [2023-05-13 01:00:04,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 0: [2023-05-13 01:00:04,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +17: [2023-05-13 01:00:04,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:04,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +22: [2023-05-13 01:00:04,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +28: [2023-05-13 01:00:04,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +28: [2023-05-13 01:00:04,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +28: [2023-05-13 01:00:04,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:04,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 2: [2023-05-13 01:00:04,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +24: [2023-05-13 01:00:04,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +28: [2023-05-13 01:00:04,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +24: [2023-05-13 01:00:04,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +28: [2023-05-13 01:00:04,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +28: [2023-05-13 01:00:04,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +28: [2023-05-13 01:00:04,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +23: [2023-05-13 01:00:04,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +28: [2023-05-13 01:00:04,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +14: [2023-05-13 01:00:04,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +30: [2023-05-13 01:00:04,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +30: [2023-05-13 01:00:04,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +30: [2023-05-13 01:00:04,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +30: [2023-05-13 01:00:04,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +20: [2023-05-13 01:00:04,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +13: [2023-05-13 01:00:04,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +13: [2023-05-13 01:00:04,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +13: [2023-05-13 01:00:04,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +30: [2023-05-13 01:00:04,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +30: [2023-05-13 01:00:04,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +25: [2023-05-13 01:00:04,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +25: [2023-05-13 01:00:04,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +25: [2023-05-13 01:00:04,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +25: [2023-05-13 01:00:04,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +17: [2023-05-13 01:00:04,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +25: [2023-05-13 01:00:04,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +17: [2023-05-13 01:00:04,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +23: [2023-05-13 01:00:04,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +17: [2023-05-13 01:00:04,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +17: [2023-05-13 01:00:04,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +17: [2023-05-13 01:00:04,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +23: [2023-05-13 01:00:04,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +23: [2023-05-13 01:00:04,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +23: [2023-05-13 01:00:04,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +23: [2023-05-13 01:00:04,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +13: [2023-05-13 01:00:04,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +13: [2023-05-13 01:00:04,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +13: [2023-05-13 01:00:04,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +13: [2023-05-13 01:00:04,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +13: [2023-05-13 01:00:04,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +13: [2023-05-13 01:00:04,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +13: [2023-05-13 01:00:04,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +20: [2023-05-13 01:00:04,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +13: [2023-05-13 01:00:04,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 1: [2023-05-13 01:00:04,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +20: [2023-05-13 01:00:04,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +20: [2023-05-13 01:00:04,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +20: [2023-05-13 01:00:04,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +20: [2023-05-13 01:00:04,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +20: [2023-05-13 01:00:04,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +20: [2023-05-13 01:00:04,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. +20: [2023-05-13 01:00:04,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_04-model_00-model_states.pt. + 3: [2023-05-13 01:00:04,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +13: [2023-05-13 01:00:04,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 3: [2023-05-13 01:00:04,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +13: [2023-05-13 01:00:04,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +13: [2023-05-13 01:00:04,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +13: [2023-05-13 01:00:04,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +13: [2023-05-13 01:00:04,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +20: [2023-05-13 01:00:04,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 1: [2023-05-13 01:00:04,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +20: [2023-05-13 01:00:04,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +20: [2023-05-13 01:00:04,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +20: [2023-05-13 01:00:04,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +20: [2023-05-13 01:00:04,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +20: [2023-05-13 01:00:04,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +20: [2023-05-13 01:00:04,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:04,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:04,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:04,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:04,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:04,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:04,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:04,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:04,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:04,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:04,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 7: [2023-05-13 01:00:04,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:04,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:04,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:04,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:04,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:04,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:04,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 7: [2023-05-13 01:00:04,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:05,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:05,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:05,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:05,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:05,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +31: [2023-05-13 01:00:05,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +31: [2023-05-13 01:00:05,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +31: [2023-05-13 01:00:05,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +31: [2023-05-13 01:00:05,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:05,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:05,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:05,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:05,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +31: [2023-05-13 01:00:05,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +31: [2023-05-13 01:00:05,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +31: [2023-05-13 01:00:05,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +16: [2023-05-13 01:00:05,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +16: [2023-05-13 01:00:05,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +16: [2023-05-13 01:00:05,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +16: [2023-05-13 01:00:05,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +16: [2023-05-13 01:00:05,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +16: [2023-05-13 01:00:05,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +16: [2023-05-13 01:00:05,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +16: [2023-05-13 01:00:05,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +21: [2023-05-13 01:00:05,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +21: [2023-05-13 01:00:05,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +21: [2023-05-13 01:00:05,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +21: [2023-05-13 01:00:05,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +21: [2023-05-13 01:00:05,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +21: [2023-05-13 01:00:05,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +26: [2023-05-13 01:00:05,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +21: [2023-05-13 01:00:05,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +26: [2023-05-13 01:00:05,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +26: [2023-05-13 01:00:05,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +16: [2023-05-13 01:00:05,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +26: [2023-05-13 01:00:05,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +26: [2023-05-13 01:00:05,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +26: [2023-05-13 01:00:05,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +26: [2023-05-13 01:00:05,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +26: [2023-05-13 01:00:05,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +21: [2023-05-13 01:00:05,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:05,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +26: [2023-05-13 01:00:05,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +16: [2023-05-13 01:00:05,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +26: [2023-05-13 01:00:05,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +16: [2023-05-13 01:00:05,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +16: [2023-05-13 01:00:05,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:05,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:05,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:05,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:05,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +16: [2023-05-13 01:00:05,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +16: [2023-05-13 01:00:05,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:05,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +26: [2023-05-13 01:00:05,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +26: [2023-05-13 01:00:05,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +26: [2023-05-13 01:00:05,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +16: [2023-05-13 01:00:05,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +26: [2023-05-13 01:00:05,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +16: [2023-05-13 01:00:05,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +26: [2023-05-13 01:00:05,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:05,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +26: [2023-05-13 01:00:05,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:05,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +16: [2023-05-13 01:00:05,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +26: [2023-05-13 01:00:05,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +21: [2023-05-13 01:00:05,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +21: [2023-05-13 01:00:05,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +21: [2023-05-13 01:00:05,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +26: [2023-05-13 01:00:05,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +21: [2023-05-13 01:00:05,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +21: [2023-05-13 01:00:05,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +16: [2023-05-13 01:00:05,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +26: [2023-05-13 01:00:05,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +26: [2023-05-13 01:00:05,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +21: [2023-05-13 01:00:05,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +21: [2023-05-13 01:00:05,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +26: [2023-05-13 01:00:05,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +16: [2023-05-13 01:00:05,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +16: [2023-05-13 01:00:05,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +16: [2023-05-13 01:00:05,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +26: [2023-05-13 01:00:05,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +26: [2023-05-13 01:00:05,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +26: [2023-05-13 01:00:05,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +16: [2023-05-13 01:00:05,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 8: [2023-05-13 01:00:05,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 8: [2023-05-13 01:00:05,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 8: [2023-05-13 01:00:05,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 8: [2023-05-13 01:00:05,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:05,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 8: [2023-05-13 01:00:05,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 8: [2023-05-13 01:00:05,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +16: [2023-05-13 01:00:05,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +16: [2023-05-13 01:00:05,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +16: [2023-05-13 01:00:05,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +27: [2023-05-13 01:00:05,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +27: [2023-05-13 01:00:05,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +27: [2023-05-13 01:00:05,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +27: [2023-05-13 01:00:05,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +27: [2023-05-13 01:00:05,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +27: [2023-05-13 01:00:05,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +27: [2023-05-13 01:00:05,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +26: [2023-05-13 01:00:05,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +27: [2023-05-13 01:00:05,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +21: [2023-05-13 01:00:05,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +21: [2023-05-13 01:00:05,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +21: [2023-05-13 01:00:05,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +27: [2023-05-13 01:00:05,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +27: [2023-05-13 01:00:05,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +27: [2023-05-13 01:00:05,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:05,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +27: [2023-05-13 01:00:05,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +27: [2023-05-13 01:00:05,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +27: [2023-05-13 01:00:05,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +27: [2023-05-13 01:00:05,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +27: [2023-05-13 01:00:05,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:05,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +26: [2023-05-13 01:00:05,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +12: [2023-05-13 01:00:05,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +12: [2023-05-13 01:00:05,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +12: [2023-05-13 01:00:05,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +21: [2023-05-13 01:00:05,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +12: [2023-05-13 01:00:05,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +12: [2023-05-13 01:00:05,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +12: [2023-05-13 01:00:05,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +12: [2023-05-13 01:00:05,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +12: [2023-05-13 01:00:05,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +11: [2023-05-13 01:00:05,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +11: [2023-05-13 01:00:05,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +11: [2023-05-13 01:00:05,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +11: [2023-05-13 01:00:05,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +11: [2023-05-13 01:00:05,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +11: [2023-05-13 01:00:05,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +11: [2023-05-13 01:00:05,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +19: [2023-05-13 01:00:05,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +11: [2023-05-13 01:00:05,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +19: [2023-05-13 01:00:05,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +19: [2023-05-13 01:00:05,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +19: [2023-05-13 01:00:05,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +19: [2023-05-13 01:00:05,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +19: [2023-05-13 01:00:05,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +19: [2023-05-13 01:00:05,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +19: [2023-05-13 01:00:05,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +21: [2023-05-13 01:00:05,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +12: [2023-05-13 01:00:05,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +19: [2023-05-13 01:00:05,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +11: [2023-05-13 01:00:05,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +11: [2023-05-13 01:00:05,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +26: [2023-05-13 01:00:05,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +11: [2023-05-13 01:00:05,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +12: [2023-05-13 01:00:05,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +11: [2023-05-13 01:00:05,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +11: [2023-05-13 01:00:05,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +12: [2023-05-13 01:00:05,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +11: [2023-05-13 01:00:05,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +12: [2023-05-13 01:00:05,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +12: [2023-05-13 01:00:05,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +11: [2023-05-13 01:00:05,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +12: [2023-05-13 01:00:05,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +21: [2023-05-13 01:00:05,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +11: [2023-05-13 01:00:05,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +12: [2023-05-13 01:00:05,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +16: [2023-05-13 01:00:05,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +12: [2023-05-13 01:00:05,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +19: [2023-05-13 01:00:05,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +19: [2023-05-13 01:00:05,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +19: [2023-05-13 01:00:05,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +16: [2023-05-13 01:00:05,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +19: [2023-05-13 01:00:05,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +19: [2023-05-13 01:00:05,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +19: [2023-05-13 01:00:05,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +19: [2023-05-13 01:00:05,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +26: [2023-05-13 01:00:05,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +26: [2023-05-13 01:00:05,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +16: [2023-05-13 01:00:05,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +16: [2023-05-13 01:00:05,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +26: [2023-05-13 01:00:05,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +26: [2023-05-13 01:00:05,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +16: [2023-05-13 01:00:05,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +16: [2023-05-13 01:00:05,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +16: [2023-05-13 01:00:05,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +22: [2023-05-13 01:00:05,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +22: [2023-05-13 01:00:05,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +22: [2023-05-13 01:00:05,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +22: [2023-05-13 01:00:05,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +22: [2023-05-13 01:00:05,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +22: [2023-05-13 01:00:05,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +22: [2023-05-13 01:00:05,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +22: [2023-05-13 01:00:05,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +26: [2023-05-13 01:00:05,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +22: [2023-05-13 01:00:05,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +22: [2023-05-13 01:00:05,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +22: [2023-05-13 01:00:05,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +22: [2023-05-13 01:00:05,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +22: [2023-05-13 01:00:05,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +22: [2023-05-13 01:00:05,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +22: [2023-05-13 01:00:05,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +10: [2023-05-13 01:00:05,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +10: [2023-05-13 01:00:05,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +22: [2023-05-13 01:00:05,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +10: [2023-05-13 01:00:05,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +10: [2023-05-13 01:00:05,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +10: [2023-05-13 01:00:05,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +10: [2023-05-13 01:00:05,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +10: [2023-05-13 01:00:05,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +10: [2023-05-13 01:00:05,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +18: [2023-05-13 01:00:05,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +18: [2023-05-13 01:00:05,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +10: [2023-05-13 01:00:05,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +10: [2023-05-13 01:00:05,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +18: [2023-05-13 01:00:05,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +18: [2023-05-13 01:00:05,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +18: [2023-05-13 01:00:05,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +18: [2023-05-13 01:00:05,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +18: [2023-05-13 01:00:05,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +10: [2023-05-13 01:00:05,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +18: [2023-05-13 01:00:05,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +10: [2023-05-13 01:00:05,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +10: [2023-05-13 01:00:05,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:05,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +15: [2023-05-13 01:00:05,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +15: [2023-05-13 01:00:05,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +15: [2023-05-13 01:00:05,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +15: [2023-05-13 01:00:05,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +15: [2023-05-13 01:00:05,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +15: [2023-05-13 01:00:05,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +10: [2023-05-13 01:00:05,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +10: [2023-05-13 01:00:05,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:05,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +10: [2023-05-13 01:00:05,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +18: [2023-05-13 01:00:05,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +18: [2023-05-13 01:00:05,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +18: [2023-05-13 01:00:05,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:05,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:05,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +24: [2023-05-13 01:00:05,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +24: [2023-05-13 01:00:05,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +24: [2023-05-13 01:00:05,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +24: [2023-05-13 01:00:05,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +24: [2023-05-13 01:00:05,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +24: [2023-05-13 01:00:05,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +24: [2023-05-13 01:00:05,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +24: [2023-05-13 01:00:05,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +18: [2023-05-13 01:00:05,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +18: [2023-05-13 01:00:05,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +18: [2023-05-13 01:00:05,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +17: [2023-05-13 01:00:05,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +17: [2023-05-13 01:00:05,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +17: [2023-05-13 01:00:05,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +18: [2023-05-13 01:00:05,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +17: [2023-05-13 01:00:05,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +17: [2023-05-13 01:00:05,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +17: [2023-05-13 01:00:05,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +17: [2023-05-13 01:00:05,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +18: [2023-05-13 01:00:05,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +17: [2023-05-13 01:00:05,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +15: [2023-05-13 01:00:05,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:05,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:05,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:05,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:05,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:05,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +24: [2023-05-13 01:00:05,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +27: [2023-05-13 01:00:05,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +24: [2023-05-13 01:00:05,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +24: [2023-05-13 01:00:05,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +24: [2023-05-13 01:00:05,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +17: [2023-05-13 01:00:05,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +17: [2023-05-13 01:00:05,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +24: [2023-05-13 01:00:05,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +24: [2023-05-13 01:00:05,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +24: [2023-05-13 01:00:05,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +17: [2023-05-13 01:00:05,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +24: [2023-05-13 01:00:05,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 8: [2023-05-13 01:00:05,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +17: [2023-05-13 01:00:05,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +17: [2023-05-13 01:00:05,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +17: [2023-05-13 01:00:05,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +17: [2023-05-13 01:00:05,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +17: [2023-05-13 01:00:05,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +19: [2023-05-13 01:00:05,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +27: [2023-05-13 01:00:05,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +27: [2023-05-13 01:00:05,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +27: [2023-05-13 01:00:05,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +27: [2023-05-13 01:00:05,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +11: [2023-05-13 01:00:05,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 8: [2023-05-13 01:00:05,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +27: [2023-05-13 01:00:05,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +11: [2023-05-13 01:00:05,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +27: [2023-05-13 01:00:05,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +27: [2023-05-13 01:00:05,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +27: [2023-05-13 01:00:05,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +11: [2023-05-13 01:00:05,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +11: [2023-05-13 01:00:05,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +12: [2023-05-13 01:00:05,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +12: [2023-05-13 01:00:05,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +11: [2023-05-13 01:00:05,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +11: [2023-05-13 01:00:05,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +11: [2023-05-13 01:00:05,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +12: [2023-05-13 01:00:05,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +19: [2023-05-13 01:00:05,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +22: [2023-05-13 01:00:05,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +22: [2023-05-13 01:00:05,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +11: [2023-05-13 01:00:05,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +22: [2023-05-13 01:00:05,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +27: [2023-05-13 01:00:05,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +27: [2023-05-13 01:00:05,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +27: [2023-05-13 01:00:05,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +19: [2023-05-13 01:00:05,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +19: [2023-05-13 01:00:05,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +19: [2023-05-13 01:00:05,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +27: [2023-05-13 01:00:05,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +10: [2023-05-13 01:00:05,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +22: [2023-05-13 01:00:05,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +11: [2023-05-13 01:00:05,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +18: [2023-05-13 01:00:05,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +18: [2023-05-13 01:00:05,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +15: [2023-05-13 01:00:05,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +10: [2023-05-13 01:00:05,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +10: [2023-05-13 01:00:05,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +22: [2023-05-13 01:00:05,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +22: [2023-05-13 01:00:05,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +11: [2023-05-13 01:00:05,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +18: [2023-05-13 01:00:05,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +12: [2023-05-13 01:00:05,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +12: [2023-05-13 01:00:05,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +12: [2023-05-13 01:00:05,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +12: [2023-05-13 01:00:05,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +11: [2023-05-13 01:00:05,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +24: [2023-05-13 01:00:05,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 8: [2023-05-13 01:00:05,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +10: [2023-05-13 01:00:05,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +10: [2023-05-13 01:00:05,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +10: [2023-05-13 01:00:05,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +10: [2023-05-13 01:00:05,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +17: [2023-05-13 01:00:05,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +22: [2023-05-13 01:00:05,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +22: [2023-05-13 01:00:05,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +24: [2023-05-13 01:00:05,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +19: [2023-05-13 01:00:05,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +19: [2023-05-13 01:00:05,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +19: [2023-05-13 01:00:05,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +19: [2023-05-13 01:00:05,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +22: [2023-05-13 01:00:05,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +27: [2023-05-13 01:00:05,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +27: [2023-05-13 01:00:05,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +22: [2023-05-13 01:00:05,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +27: [2023-05-13 01:00:05,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +11: [2023-05-13 01:00:05,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +15: [2023-05-13 01:00:05,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +12: [2023-05-13 01:00:05,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +12: [2023-05-13 01:00:05,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +12: [2023-05-13 01:00:05,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +29: [2023-05-13 01:00:05,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +29: [2023-05-13 01:00:05,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +17: [2023-05-13 01:00:05,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +11: [2023-05-13 01:00:05,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +29: [2023-05-13 01:00:05,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +29: [2023-05-13 01:00:05,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +29: [2023-05-13 01:00:05,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +29: [2023-05-13 01:00:05,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +29: [2023-05-13 01:00:05,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +22: [2023-05-13 01:00:05,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +29: [2023-05-13 01:00:05,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +25: [2023-05-13 01:00:05,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +25: [2023-05-13 01:00:05,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +25: [2023-05-13 01:00:05,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +25: [2023-05-13 01:00:05,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +25: [2023-05-13 01:00:05,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +25: [2023-05-13 01:00:05,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +25: [2023-05-13 01:00:05,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +18: [2023-05-13 01:00:05,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +18: [2023-05-13 01:00:05,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 3: [2023-05-13 01:00:05,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 3: [2023-05-13 01:00:05,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +25: [2023-05-13 01:00:05,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +19: [2023-05-13 01:00:05,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +18: [2023-05-13 01:00:05,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +29: [2023-05-13 01:00:05,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 3: [2023-05-13 01:00:05,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +29: [2023-05-13 01:00:05,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +25: [2023-05-13 01:00:05,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +25: [2023-05-13 01:00:05,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:05,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 3: [2023-05-13 01:00:05,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 3: [2023-05-13 01:00:05,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 3: [2023-05-13 01:00:05,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +29: [2023-05-13 01:00:05,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 3: [2023-05-13 01:00:05,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +10: [2023-05-13 01:00:05,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +29: [2023-05-13 01:00:05,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +11: [2023-05-13 01:00:05,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:05,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +11: [2023-05-13 01:00:05,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:05,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:05,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +15: [2023-05-13 01:00:05,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +29: [2023-05-13 01:00:05,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +29: [2023-05-13 01:00:05,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +29: [2023-05-13 01:00:05,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +29: [2023-05-13 01:00:05,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +10: [2023-05-13 01:00:05,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +25: [2023-05-13 01:00:05,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:05,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +15: [2023-05-13 01:00:05,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +15: [2023-05-13 01:00:05,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +22: [2023-05-13 01:00:05,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +25: [2023-05-13 01:00:05,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +25: [2023-05-13 01:00:05,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +25: [2023-05-13 01:00:05,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +19: [2023-05-13 01:00:05,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +25: [2023-05-13 01:00:05,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +25: [2023-05-13 01:00:05,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +24: [2023-05-13 01:00:05,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +24: [2023-05-13 01:00:05,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +19: [2023-05-13 01:00:05,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:05,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:05,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 3: [2023-05-13 01:00:05,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +17: [2023-05-13 01:00:05,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +18: [2023-05-13 01:00:05,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:05,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:05,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:05,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +18: [2023-05-13 01:00:05,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +12: [2023-05-13 01:00:05,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +24: [2023-05-13 01:00:05,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +18: [2023-05-13 01:00:05,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +18: [2023-05-13 01:00:05,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +17: [2023-05-13 01:00:05,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +10: [2023-05-13 01:00:05,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +10: [2023-05-13 01:00:05,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +18: [2023-05-13 01:00:05,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +22: [2023-05-13 01:00:05,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +24: [2023-05-13 01:00:05,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +22: [2023-05-13 01:00:05,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +22: [2023-05-13 01:00:05,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +22: [2023-05-13 01:00:05,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +11: [2023-05-13 01:00:05,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +24: [2023-05-13 01:00:05,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +24: [2023-05-13 01:00:05,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +24: [2023-05-13 01:00:05,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +24: [2023-05-13 01:00:05,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +10: [2023-05-13 01:00:05,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +12: [2023-05-13 01:00:05,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +12: [2023-05-13 01:00:05,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +12: [2023-05-13 01:00:05,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +12: [2023-05-13 01:00:05,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +10: [2023-05-13 01:00:05,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +10: [2023-05-13 01:00:05,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +10: [2023-05-13 01:00:05,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +19: [2023-05-13 01:00:05,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +17: [2023-05-13 01:00:05,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +17: [2023-05-13 01:00:05,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +17: [2023-05-13 01:00:05,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +17: [2023-05-13 01:00:05,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +19: [2023-05-13 01:00:05,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +19: [2023-05-13 01:00:05,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +15: [2023-05-13 01:00:05,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +19: [2023-05-13 01:00:05,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +17: [2023-05-13 01:00:05,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +18: [2023-05-13 01:00:05,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +10: [2023-05-13 01:00:05,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +15: [2023-05-13 01:00:05,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +15: [2023-05-13 01:00:05,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +18: [2023-05-13 01:00:05,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +15: [2023-05-13 01:00:05,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +18: [2023-05-13 01:00:05,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +24: [2023-05-13 01:00:05,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +15: [2023-05-13 01:00:05,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +24: [2023-05-13 01:00:05,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +12: [2023-05-13 01:00:05,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +17: [2023-05-13 01:00:05,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +15: [2023-05-13 01:00:05,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +18: [2023-05-13 01:00:05,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +15: [2023-05-13 01:00:05,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +18: [2023-05-13 01:00:05,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +24: [2023-05-13 01:00:05,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +24: [2023-05-13 01:00:05,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +30: [2023-05-13 01:00:05,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +28: [2023-05-13 01:00:05,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +28: [2023-05-13 01:00:05,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +28: [2023-05-13 01:00:05,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +28: [2023-05-13 01:00:05,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +28: [2023-05-13 01:00:05,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +28: [2023-05-13 01:00:05,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +28: [2023-05-13 01:00:05,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +28: [2023-05-13 01:00:05,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +30: [2023-05-13 01:00:05,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +30: [2023-05-13 01:00:05,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +30: [2023-05-13 01:00:05,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +30: [2023-05-13 01:00:05,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +30: [2023-05-13 01:00:05,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +30: [2023-05-13 01:00:05,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +30: [2023-05-13 01:00:05,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +17: [2023-05-13 01:00:05,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +24: [2023-05-13 01:00:05,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +24: [2023-05-13 01:00:05,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +30: [2023-05-13 01:00:05,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +13: [2023-05-13 01:00:05,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +13: [2023-05-13 01:00:05,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +13: [2023-05-13 01:00:05,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +30: [2023-05-13 01:00:05,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +28: [2023-05-13 01:00:05,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +13: [2023-05-13 01:00:05,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +13: [2023-05-13 01:00:05,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +13: [2023-05-13 01:00:05,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +13: [2023-05-13 01:00:05,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +28: [2023-05-13 01:00:05,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +28: [2023-05-13 01:00:05,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +13: [2023-05-13 01:00:05,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +28: [2023-05-13 01:00:05,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +28: [2023-05-13 01:00:05,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +28: [2023-05-13 01:00:05,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +28: [2023-05-13 01:00:05,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +28: [2023-05-13 01:00:05,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:05,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +13: [2023-05-13 01:00:05,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +13: [2023-05-13 01:00:05,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +30: [2023-05-13 01:00:05,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +30: [2023-05-13 01:00:05,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +30: [2023-05-13 01:00:05,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +13: [2023-05-13 01:00:05,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +15: [2023-05-13 01:00:05,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +30: [2023-05-13 01:00:05,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +30: [2023-05-13 01:00:05,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +30: [2023-05-13 01:00:05,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 3: [2023-05-13 01:00:05,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 3: [2023-05-13 01:00:05,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 3: [2023-05-13 01:00:05,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +25: [2023-05-13 01:00:05,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +25: [2023-05-13 01:00:05,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +29: [2023-05-13 01:00:05,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +17: [2023-05-13 01:00:05,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +17: [2023-05-13 01:00:05,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +13: [2023-05-13 01:00:05,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +13: [2023-05-13 01:00:05,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +13: [2023-05-13 01:00:05,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +13: [2023-05-13 01:00:05,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +13: [2023-05-13 01:00:05,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 2: [2023-05-13 01:00:05,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 2: [2023-05-13 01:00:05,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 2: [2023-05-13 01:00:05,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +17: [2023-05-13 01:00:05,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +17: [2023-05-13 01:00:05,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:05,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 2: [2023-05-13 01:00:05,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 2: [2023-05-13 01:00:05,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 2: [2023-05-13 01:00:05,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 2: [2023-05-13 01:00:05,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +29: [2023-05-13 01:00:05,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +29: [2023-05-13 01:00:05,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +29: [2023-05-13 01:00:05,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +29: [2023-05-13 01:00:05,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 2: [2023-05-13 01:00:05,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:05,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +31: [2023-05-13 01:00:05,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 2: [2023-05-13 01:00:05,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +23: [2023-05-13 01:00:05,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +23: [2023-05-13 01:00:05,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +23: [2023-05-13 01:00:05,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 2: [2023-05-13 01:00:05,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:05,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +31: [2023-05-13 01:00:05,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +23: [2023-05-13 01:00:05,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +23: [2023-05-13 01:00:05,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +23: [2023-05-13 01:00:05,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +23: [2023-05-13 01:00:05,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:05,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +31: [2023-05-13 01:00:05,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +31: [2023-05-13 01:00:05,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +25: [2023-05-13 01:00:05,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +23: [2023-05-13 01:00:05,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:05,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 2: [2023-05-13 01:00:05,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 2: [2023-05-13 01:00:05,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:05,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:05,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:05,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:05,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 2: [2023-05-13 01:00:05,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +23: [2023-05-13 01:00:05,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +23: [2023-05-13 01:00:05,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +29: [2023-05-13 01:00:05,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +23: [2023-05-13 01:00:05,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:05,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +31: [2023-05-13 01:00:05,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +31: [2023-05-13 01:00:05,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +31: [2023-05-13 01:00:05,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:05,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 3: [2023-05-13 01:00:05,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 3: [2023-05-13 01:00:05,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 3: [2023-05-13 01:00:05,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:05,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +23: [2023-05-13 01:00:05,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:05,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +23: [2023-05-13 01:00:05,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +23: [2023-05-13 01:00:05,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +17: [2023-05-13 01:00:05,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +23: [2023-05-13 01:00:05,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +23: [2023-05-13 01:00:05,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +29: [2023-05-13 01:00:05,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +29: [2023-05-13 01:00:05,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 3: [2023-05-13 01:00:05,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +25: [2023-05-13 01:00:05,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +25: [2023-05-13 01:00:05,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:05,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:05,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +25: [2023-05-13 01:00:05,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +25: [2023-05-13 01:00:05,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +25: [2023-05-13 01:00:05,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +25: [2023-05-13 01:00:05,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +25: [2023-05-13 01:00:05,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 3: [2023-05-13 01:00:05,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +29: [2023-05-13 01:00:05,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +25: [2023-05-13 01:00:05,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +29: [2023-05-13 01:00:05,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +29: [2023-05-13 01:00:05,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +29: [2023-05-13 01:00:05,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +29: [2023-05-13 01:00:05,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +30: [2023-05-13 01:00:05,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +30: [2023-05-13 01:00:05,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 3: [2023-05-13 01:00:05,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +29: [2023-05-13 01:00:05,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:05,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +29: [2023-05-13 01:00:05,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +29: [2023-05-13 01:00:05,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:05,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:05,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +13: [2023-05-13 01:00:05,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +13: [2023-05-13 01:00:05,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 3: [2023-05-13 01:00:05,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +28: [2023-05-13 01:00:05,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +28: [2023-05-13 01:00:05,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +28: [2023-05-13 01:00:05,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +28: [2023-05-13 01:00:05,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +28: [2023-05-13 01:00:05,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +28: [2023-05-13 01:00:05,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +28: [2023-05-13 01:00:05,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +28: [2023-05-13 01:00:05,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +25: [2023-05-13 01:00:05,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +25: [2023-05-13 01:00:05,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +25: [2023-05-13 01:00:05,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +25: [2023-05-13 01:00:05,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +25: [2023-05-13 01:00:05,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +30: [2023-05-13 01:00:05,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +13: [2023-05-13 01:00:05,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +13: [2023-05-13 01:00:05,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +13: [2023-05-13 01:00:05,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 2: [2023-05-13 01:00:05,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 2: [2023-05-13 01:00:05,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +30: [2023-05-13 01:00:05,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +30: [2023-05-13 01:00:05,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +30: [2023-05-13 01:00:05,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +23: [2023-05-13 01:00:05,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +23: [2023-05-13 01:00:05,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +13: [2023-05-13 01:00:05,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +30: [2023-05-13 01:00:05,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +30: [2023-05-13 01:00:05,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:05,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +31: [2023-05-13 01:00:05,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +31: [2023-05-13 01:00:05,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +31: [2023-05-13 01:00:05,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +31: [2023-05-13 01:00:05,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +31: [2023-05-13 01:00:05,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +31: [2023-05-13 01:00:05,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 2: [2023-05-13 01:00:05,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 2: [2023-05-13 01:00:05,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +13: [2023-05-13 01:00:05,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +13: [2023-05-13 01:00:05,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +13: [2023-05-13 01:00:05,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:05,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +31: [2023-05-13 01:00:05,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +13: [2023-05-13 01:00:05,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +23: [2023-05-13 01:00:05,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 1: [2023-05-13 01:00:05,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 1: [2023-05-13 01:00:05,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 1: [2023-05-13 01:00:05,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 1: [2023-05-13 01:00:05,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 1: [2023-05-13 01:00:05,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 1: [2023-05-13 01:00:05,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 1: [2023-05-13 01:00:05,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +28: [2023-05-13 01:00:05,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 1: [2023-05-13 01:00:05,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 2: [2023-05-13 01:00:05,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 1: [2023-05-13 01:00:05,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 1: [2023-05-13 01:00:05,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +14: [2023-05-13 01:00:05,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +14: [2023-05-13 01:00:05,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +14: [2023-05-13 01:00:05,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +20: [2023-05-13 01:00:05,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +20: [2023-05-13 01:00:05,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +20: [2023-05-13 01:00:05,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +20: [2023-05-13 01:00:05,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +20: [2023-05-13 01:00:05,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +20: [2023-05-13 01:00:05,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +20: [2023-05-13 01:00:05,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +20: [2023-05-13 01:00:05,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 1: [2023-05-13 01:00:05,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +14: [2023-05-13 01:00:05,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +14: [2023-05-13 01:00:05,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 1: [2023-05-13 01:00:05,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +14: [2023-05-13 01:00:05,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +30: [2023-05-13 01:00:05,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +28: [2023-05-13 01:00:05,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +28: [2023-05-13 01:00:05,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +30: [2023-05-13 01:00:05,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +28: [2023-05-13 01:00:05,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +28: [2023-05-13 01:00:05,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:05,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +23: [2023-05-13 01:00:05,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +28: [2023-05-13 01:00:05,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +28: [2023-05-13 01:00:05,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +28: [2023-05-13 01:00:05,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +30: [2023-05-13 01:00:05,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 1: [2023-05-13 01:00:05,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 1: [2023-05-13 01:00:05,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +30: [2023-05-13 01:00:05,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 1: [2023-05-13 01:00:05,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 1: [2023-05-13 01:00:05,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... + 2: [2023-05-13 01:00:05,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 2: [2023-05-13 01:00:05,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +23: [2023-05-13 01:00:05,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:05,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:05,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +31: [2023-05-13 01:00:05,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +13: [2023-05-13 01:00:05,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +13: [2023-05-13 01:00:05,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +13: [2023-05-13 01:00:05,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:05,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +31: [2023-05-13 01:00:05,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +20: [2023-05-13 01:00:05,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +13: [2023-05-13 01:00:05,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:05,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +20: [2023-05-13 01:00:05,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +23: [2023-05-13 01:00:05,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +23: [2023-05-13 01:00:05,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +23: [2023-05-13 01:00:05,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +20: [2023-05-13 01:00:05,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +30: [2023-05-13 01:00:05,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:05,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +20: [2023-05-13 01:00:05,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt... +30: [2023-05-13 01:00:05,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +23: [2023-05-13 01:00:05,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +31: [2023-05-13 01:00:05,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +31: [2023-05-13 01:00:05,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +31: [2023-05-13 01:00:05,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +31: [2023-05-13 01:00:05,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +31: [2023-05-13 01:00:05,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +31: [2023-05-13 01:00:05,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +13: [2023-05-13 01:00:05,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +13: [2023-05-13 01:00:05,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:05,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:05,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:05,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +23: [2023-05-13 01:00:05,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +23: [2023-05-13 01:00:05,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +30: [2023-05-13 01:00:05,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +30: [2023-05-13 01:00:05,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:05,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:05,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:05,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +23: [2023-05-13 01:00:05,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +23: [2023-05-13 01:00:05,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +23: [2023-05-13 01:00:05,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 1: [2023-05-13 01:00:05,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +23: [2023-05-13 01:00:05,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:05,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +23: [2023-05-13 01:00:05,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +14: [2023-05-13 01:00:05,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 1: [2023-05-13 01:00:05,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 1: [2023-05-13 01:00:05,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 1: [2023-05-13 01:00:05,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 1: [2023-05-13 01:00:05,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:05,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 1: [2023-05-13 01:00:05,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 1: [2023-05-13 01:00:05,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 1: [2023-05-13 01:00:05,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 1: [2023-05-13 01:00:05,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +14: [2023-05-13 01:00:05,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 1: [2023-05-13 01:00:05,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:05,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:05,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +14: [2023-05-13 01:00:05,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:05,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +20: [2023-05-13 01:00:05,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +20: [2023-05-13 01:00:05,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +20: [2023-05-13 01:00:05,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. +14: [2023-05-13 01:00:05,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +14: [2023-05-13 01:00:05,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +14: [2023-05-13 01:00:05,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 1: [2023-05-13 01:00:05,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:05,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_05-model_00-model_states.pt. + 1: [2023-05-13 01:00:05,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 1: [2023-05-13 01:00:05,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 1: [2023-05-13 01:00:05,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 1: [2023-05-13 01:00:05,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 1: [2023-05-13 01:00:05,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:05,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:05,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:05,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:05,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:05,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:05,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:05,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +31: [2023-05-13 01:00:05,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +31: [2023-05-13 01:00:05,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:05,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +31: [2023-05-13 01:00:05,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +31: [2023-05-13 01:00:05,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +31: [2023-05-13 01:00:05,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +31: [2023-05-13 01:00:05,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +31: [2023-05-13 01:00:05,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:05,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +16: [2023-05-13 01:00:05,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +16: [2023-05-13 01:00:05,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +16: [2023-05-13 01:00:05,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +16: [2023-05-13 01:00:05,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +16: [2023-05-13 01:00:05,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +31: [2023-05-13 01:00:05,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:05,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +31: [2023-05-13 01:00:05,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +31: [2023-05-13 01:00:05,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +16: [2023-05-13 01:00:05,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +21: [2023-05-13 01:00:05,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:05,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:05,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:05,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:05,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:05,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:05,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:05,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +31: [2023-05-13 01:00:05,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +31: [2023-05-13 01:00:05,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +31: [2023-05-13 01:00:05,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +31: [2023-05-13 01:00:05,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +31: [2023-05-13 01:00:05,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +16: [2023-05-13 01:00:05,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +21: [2023-05-13 01:00:05,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +21: [2023-05-13 01:00:05,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +16: [2023-05-13 01:00:05,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +21: [2023-05-13 01:00:05,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +16: [2023-05-13 01:00:05,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +31: [2023-05-13 01:00:05,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:05,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +21: [2023-05-13 01:00:05,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +16: [2023-05-13 01:00:05,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +16: [2023-05-13 01:00:05,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +21: [2023-05-13 01:00:05,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +16: [2023-05-13 01:00:05,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +16: [2023-05-13 01:00:05,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +21: [2023-05-13 01:00:05,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +21: [2023-05-13 01:00:05,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +26: [2023-05-13 01:00:05,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +26: [2023-05-13 01:00:05,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +26: [2023-05-13 01:00:05,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +26: [2023-05-13 01:00:05,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +26: [2023-05-13 01:00:05,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +26: [2023-05-13 01:00:05,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +26: [2023-05-13 01:00:05,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +26: [2023-05-13 01:00:05,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +26: [2023-05-13 01:00:05,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +26: [2023-05-13 01:00:05,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +26: [2023-05-13 01:00:05,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +26: [2023-05-13 01:00:05,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +26: [2023-05-13 01:00:05,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +26: [2023-05-13 01:00:05,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +26: [2023-05-13 01:00:05,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +26: [2023-05-13 01:00:05,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +16: [2023-05-13 01:00:05,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +31: [2023-05-13 01:00:05,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +31: [2023-05-13 01:00:05,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +31: [2023-05-13 01:00:05,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +31: [2023-05-13 01:00:05,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +31: [2023-05-13 01:00:05,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +31: [2023-05-13 01:00:05,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +31: [2023-05-13 01:00:05,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +21: [2023-05-13 01:00:05,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:05,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:05,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:05,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:05,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:05,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:05,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:05,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 5: [2023-05-13 01:00:05,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +16: [2023-05-13 01:00:05,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:05,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +31: [2023-05-13 01:00:05,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +26: [2023-05-13 01:00:05,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +26: [2023-05-13 01:00:05,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +16: [2023-05-13 01:00:05,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +16: [2023-05-13 01:00:05,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +16: [2023-05-13 01:00:05,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +16: [2023-05-13 01:00:05,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +16: [2023-05-13 01:00:05,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +16: [2023-05-13 01:00:05,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +16: [2023-05-13 01:00:05,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +31: [2023-05-13 01:00:05,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +31: [2023-05-13 01:00:05,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +31: [2023-05-13 01:00:05,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +31: [2023-05-13 01:00:05,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +31: [2023-05-13 01:00:05,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +31: [2023-05-13 01:00:05,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +21: [2023-05-13 01:00:05,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:05,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:05,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +31: [2023-05-13 01:00:05,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +21: [2023-05-13 01:00:05,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:05,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:05,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:05,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:05,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:05,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +31: [2023-05-13 01:00:05,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:05,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +26: [2023-05-13 01:00:05,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +26: [2023-05-13 01:00:05,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +26: [2023-05-13 01:00:05,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +26: [2023-05-13 01:00:05,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 7: [2023-05-13 01:00:05,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:05,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:05,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:05,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +16: [2023-05-13 01:00:05,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +16: [2023-05-13 01:00:05,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +16: [2023-05-13 01:00:05,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +16: [2023-05-13 01:00:05,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:05,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +16: [2023-05-13 01:00:05,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +16: [2023-05-13 01:00:05,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +16: [2023-05-13 01:00:05,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:05,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:05,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:05,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:05,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:05,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +17: [2023-05-13 01:00:05,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +17: [2023-05-13 01:00:05,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +17: [2023-05-13 01:00:05,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +17: [2023-05-13 01:00:05,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +17: [2023-05-13 01:00:05,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +17: [2023-05-13 01:00:05,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +17: [2023-05-13 01:00:05,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +17: [2023-05-13 01:00:05,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +17: [2023-05-13 01:00:05,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +17: [2023-05-13 01:00:05,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +17: [2023-05-13 01:00:05,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +17: [2023-05-13 01:00:05,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +17: [2023-05-13 01:00:05,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +17: [2023-05-13 01:00:05,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +17: [2023-05-13 01:00:05,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +17: [2023-05-13 01:00:05,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +17: [2023-05-13 01:00:05,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +10: [2023-05-13 01:00:05,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +10: [2023-05-13 01:00:05,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +10: [2023-05-13 01:00:05,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +10: [2023-05-13 01:00:05,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +10: [2023-05-13 01:00:05,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +10: [2023-05-13 01:00:05,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +10: [2023-05-13 01:00:05,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +10: [2023-05-13 01:00:05,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +10: [2023-05-13 01:00:05,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +10: [2023-05-13 01:00:05,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +10: [2023-05-13 01:00:05,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +17: [2023-05-13 01:00:05,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +10: [2023-05-13 01:00:05,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +10: [2023-05-13 01:00:05,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +10: [2023-05-13 01:00:05,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +10: [2023-05-13 01:00:05,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +10: [2023-05-13 01:00:05,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +19: [2023-05-13 01:00:05,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:05,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:05,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:05,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:05,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:05,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:05,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:05,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +17: [2023-05-13 01:00:05,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +19: [2023-05-13 01:00:05,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +19: [2023-05-13 01:00:05,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +19: [2023-05-13 01:00:05,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:05,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:05,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:05,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +19: [2023-05-13 01:00:05,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +19: [2023-05-13 01:00:05,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +17: [2023-05-13 01:00:05,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +17: [2023-05-13 01:00:05,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +17: [2023-05-13 01:00:05,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +17: [2023-05-13 01:00:05,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +17: [2023-05-13 01:00:05,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +17: [2023-05-13 01:00:05,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +17: [2023-05-13 01:00:05,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 8: [2023-05-13 01:00:05,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 8: [2023-05-13 01:00:05,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 8: [2023-05-13 01:00:05,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 8: [2023-05-13 01:00:05,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 8: [2023-05-13 01:00:05,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 8: [2023-05-13 01:00:05,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 8: [2023-05-13 01:00:05,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +17: [2023-05-13 01:00:05,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +10: [2023-05-13 01:00:05,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +10: [2023-05-13 01:00:05,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +10: [2023-05-13 01:00:05,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +10: [2023-05-13 01:00:05,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:05,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +10: [2023-05-13 01:00:05,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +10: [2023-05-13 01:00:05,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +10: [2023-05-13 01:00:05,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +10: [2023-05-13 01:00:05,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +15: [2023-05-13 01:00:05,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +15: [2023-05-13 01:00:05,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +28: [2023-05-13 01:00:05,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +28: [2023-05-13 01:00:05,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +28: [2023-05-13 01:00:05,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +28: [2023-05-13 01:00:05,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +28: [2023-05-13 01:00:05,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +28: [2023-05-13 01:00:05,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +28: [2023-05-13 01:00:05,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +28: [2023-05-13 01:00:05,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +15: [2023-05-13 01:00:05,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +15: [2023-05-13 01:00:05,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +15: [2023-05-13 01:00:05,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +15: [2023-05-13 01:00:05,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +15: [2023-05-13 01:00:05,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +15: [2023-05-13 01:00:05,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +15: [2023-05-13 01:00:05,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +15: [2023-05-13 01:00:05,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:05,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +25: [2023-05-13 01:00:05,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +25: [2023-05-13 01:00:05,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +25: [2023-05-13 01:00:05,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +25: [2023-05-13 01:00:05,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +25: [2023-05-13 01:00:05,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +25: [2023-05-13 01:00:05,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:05,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +28: [2023-05-13 01:00:05,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +28: [2023-05-13 01:00:05,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +28: [2023-05-13 01:00:05,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +28: [2023-05-13 01:00:05,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +28: [2023-05-13 01:00:05,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +28: [2023-05-13 01:00:05,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +28: [2023-05-13 01:00:05,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +28: [2023-05-13 01:00:05,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 6: [2023-05-13 01:00:05,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +15: [2023-05-13 01:00:05,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:05,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +15: [2023-05-13 01:00:05,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +15: [2023-05-13 01:00:05,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +25: [2023-05-13 01:00:05,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +25: [2023-05-13 01:00:05,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +15: [2023-05-13 01:00:05,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +17: [2023-05-13 01:00:05,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:05,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +15: [2023-05-13 01:00:05,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +15: [2023-05-13 01:00:05,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +17: [2023-05-13 01:00:05,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +17: [2023-05-13 01:00:05,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +17: [2023-05-13 01:00:05,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +17: [2023-05-13 01:00:05,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:05,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +25: [2023-05-13 01:00:05,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +25: [2023-05-13 01:00:05,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +25: [2023-05-13 01:00:05,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +25: [2023-05-13 01:00:05,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +10: [2023-05-13 01:00:05,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:05,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +10: [2023-05-13 01:00:05,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +10: [2023-05-13 01:00:05,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +10: [2023-05-13 01:00:05,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +19: [2023-05-13 01:00:05,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:05,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:05,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +10: [2023-05-13 01:00:05,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +10: [2023-05-13 01:00:05,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +10: [2023-05-13 01:00:05,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +10: [2023-05-13 01:00:05,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:05,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:05,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:05,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:05,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 0: [2023-05-13 01:00:05,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 4: [2023-05-13 01:00:05,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:05,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +21: [2023-05-13 01:00:05,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 0: [2023-05-13 01:00:05,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:05,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +21: [2023-05-13 01:00:05,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:05,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +21: [2023-05-13 01:00:05,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +21: [2023-05-13 01:00:05,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +21: [2023-05-13 01:00:05,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 4: [2023-05-13 01:00:05,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:05,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:05,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +15: [2023-05-13 01:00:05,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 9: [2023-05-13 01:00:05,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 9: [2023-05-13 01:00:05,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:05,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:05,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 8: [2023-05-13 01:00:05,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +27: [2023-05-13 01:00:05,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +27: [2023-05-13 01:00:05,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:05,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +19: [2023-05-13 01:00:05,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:05,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +25: [2023-05-13 01:00:05,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 8: [2023-05-13 01:00:05,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +27: [2023-05-13 01:00:05,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +27: [2023-05-13 01:00:05,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +27: [2023-05-13 01:00:05,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +27: [2023-05-13 01:00:05,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +27: [2023-05-13 01:00:05,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:05,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +27: [2023-05-13 01:00:05,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:05,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +22: [2023-05-13 01:00:05,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +22: [2023-05-13 01:00:05,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +22: [2023-05-13 01:00:05,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +22: [2023-05-13 01:00:05,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:05,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +22: [2023-05-13 01:00:05,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +22: [2023-05-13 01:00:05,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +22: [2023-05-13 01:00:05,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +22: [2023-05-13 01:00:05,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +27: [2023-05-13 01:00:06,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +27: [2023-05-13 01:00:06,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +19: [2023-05-13 01:00:06,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +27: [2023-05-13 01:00:06,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +27: [2023-05-13 01:00:06,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +15: [2023-05-13 01:00:06,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +27: [2023-05-13 01:00:06,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +27: [2023-05-13 01:00:06,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +22: [2023-05-13 01:00:06,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +19: [2023-05-13 01:00:06,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +27: [2023-05-13 01:00:06,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +27: [2023-05-13 01:00:06,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +22: [2023-05-13 01:00:06,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +22: [2023-05-13 01:00:06,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +22: [2023-05-13 01:00:06,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +22: [2023-05-13 01:00:06,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +28: [2023-05-13 01:00:06,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +28: [2023-05-13 01:00:06,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +22: [2023-05-13 01:00:06,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +22: [2023-05-13 01:00:06,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +28: [2023-05-13 01:00:06,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +22: [2023-05-13 01:00:06,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +28: [2023-05-13 01:00:06,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +11: [2023-05-13 01:00:06,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +11: [2023-05-13 01:00:06,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +28: [2023-05-13 01:00:06,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +28: [2023-05-13 01:00:06,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +28: [2023-05-13 01:00:06,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +11: [2023-05-13 01:00:06,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +11: [2023-05-13 01:00:06,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +11: [2023-05-13 01:00:06,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +11: [2023-05-13 01:00:06,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +11: [2023-05-13 01:00:06,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:06,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +11: [2023-05-13 01:00:06,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:06,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +19: [2023-05-13 01:00:06,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +24: [2023-05-13 01:00:06,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +24: [2023-05-13 01:00:06,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +24: [2023-05-13 01:00:06,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +24: [2023-05-13 01:00:06,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +24: [2023-05-13 01:00:06,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +24: [2023-05-13 01:00:06,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +19: [2023-05-13 01:00:06,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:06,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +11: [2023-05-13 01:00:06,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +11: [2023-05-13 01:00:06,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +11: [2023-05-13 01:00:06,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +11: [2023-05-13 01:00:06,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +24: [2023-05-13 01:00:06,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +11: [2023-05-13 01:00:06,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +11: [2023-05-13 01:00:06,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +11: [2023-05-13 01:00:06,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +24: [2023-05-13 01:00:06,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +11: [2023-05-13 01:00:06,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +24: [2023-05-13 01:00:06,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +24: [2023-05-13 01:00:06,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +15: [2023-05-13 01:00:06,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:06,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +15: [2023-05-13 01:00:06,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +15: [2023-05-13 01:00:06,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +24: [2023-05-13 01:00:06,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +24: [2023-05-13 01:00:06,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +24: [2023-05-13 01:00:06,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +24: [2023-05-13 01:00:06,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +28: [2023-05-13 01:00:06,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +25: [2023-05-13 01:00:06,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +15: [2023-05-13 01:00:06,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +15: [2023-05-13 01:00:06,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +15: [2023-05-13 01:00:06,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +15: [2023-05-13 01:00:06,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +15: [2023-05-13 01:00:06,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:06,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +25: [2023-05-13 01:00:06,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +25: [2023-05-13 01:00:06,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +28: [2023-05-13 01:00:06,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:06,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:06,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +28: [2023-05-13 01:00:06,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +25: [2023-05-13 01:00:06,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +28: [2023-05-13 01:00:06,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +28: [2023-05-13 01:00:06,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +28: [2023-05-13 01:00:06,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +28: [2023-05-13 01:00:06,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +28: [2023-05-13 01:00:06,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +15: [2023-05-13 01:00:06,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +15: [2023-05-13 01:00:06,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +28: [2023-05-13 01:00:06,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:06,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +21: [2023-05-13 01:00:06,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +21: [2023-05-13 01:00:06,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +21: [2023-05-13 01:00:06,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +22: [2023-05-13 01:00:06,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +22: [2023-05-13 01:00:06,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +15: [2023-05-13 01:00:06,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +15: [2023-05-13 01:00:06,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +27: [2023-05-13 01:00:06,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +15: [2023-05-13 01:00:06,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:06,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +21: [2023-05-13 01:00:06,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +27: [2023-05-13 01:00:06,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +27: [2023-05-13 01:00:06,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:06,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +21: [2023-05-13 01:00:06,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +27: [2023-05-13 01:00:06,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +27: [2023-05-13 01:00:06,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +25: [2023-05-13 01:00:06,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:06,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:06,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:06,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:06,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +15: [2023-05-13 01:00:06,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +24: [2023-05-13 01:00:06,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +22: [2023-05-13 01:00:06,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +24: [2023-05-13 01:00:06,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +22: [2023-05-13 01:00:06,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +11: [2023-05-13 01:00:06,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +11: [2023-05-13 01:00:06,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +11: [2023-05-13 01:00:06,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +22: [2023-05-13 01:00:06,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +22: [2023-05-13 01:00:06,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +22: [2023-05-13 01:00:06,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +27: [2023-05-13 01:00:06,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +22: [2023-05-13 01:00:06,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +21: [2023-05-13 01:00:06,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +22: [2023-05-13 01:00:06,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +22: [2023-05-13 01:00:06,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:06,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +21: [2023-05-13 01:00:06,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +21: [2023-05-13 01:00:06,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +11: [2023-05-13 01:00:06,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +11: [2023-05-13 01:00:06,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +11: [2023-05-13 01:00:06,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +11: [2023-05-13 01:00:06,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +24: [2023-05-13 01:00:06,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +24: [2023-05-13 01:00:06,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +27: [2023-05-13 01:00:06,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:06,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +27: [2023-05-13 01:00:06,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:06,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +27: [2023-05-13 01:00:06,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:06,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +27: [2023-05-13 01:00:06,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +27: [2023-05-13 01:00:06,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +27: [2023-05-13 01:00:06,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +22: [2023-05-13 01:00:06,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:06,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +11: [2023-05-13 01:00:06,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +27: [2023-05-13 01:00:06,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +11: [2023-05-13 01:00:06,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +22: [2023-05-13 01:00:06,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:06,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +26: [2023-05-13 01:00:06,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +26: [2023-05-13 01:00:06,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +26: [2023-05-13 01:00:06,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +26: [2023-05-13 01:00:06,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +26: [2023-05-13 01:00:06,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +26: [2023-05-13 01:00:06,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:06,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +22: [2023-05-13 01:00:06,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +22: [2023-05-13 01:00:06,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +24: [2023-05-13 01:00:06,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +24: [2023-05-13 01:00:06,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +24: [2023-05-13 01:00:06,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +24: [2023-05-13 01:00:06,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +22: [2023-05-13 01:00:06,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +22: [2023-05-13 01:00:06,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +26: [2023-05-13 01:00:06,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:06,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +26: [2023-05-13 01:00:06,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:06,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +26: [2023-05-13 01:00:06,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:06,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:06,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:06,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +12: [2023-05-13 01:00:06,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +12: [2023-05-13 01:00:06,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +12: [2023-05-13 01:00:06,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +12: [2023-05-13 01:00:06,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +12: [2023-05-13 01:00:06,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +12: [2023-05-13 01:00:06,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +12: [2023-05-13 01:00:06,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +12: [2023-05-13 01:00:06,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +12: [2023-05-13 01:00:06,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +18: [2023-05-13 01:00:06,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +18: [2023-05-13 01:00:06,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +11: [2023-05-13 01:00:06,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +11: [2023-05-13 01:00:06,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +11: [2023-05-13 01:00:06,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +18: [2023-05-13 01:00:06,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +20: [2023-05-13 01:00:06,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +20: [2023-05-13 01:00:06,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +20: [2023-05-13 01:00:06,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +20: [2023-05-13 01:00:06,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +20: [2023-05-13 01:00:06,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +20: [2023-05-13 01:00:06,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +20: [2023-05-13 01:00:06,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +18: [2023-05-13 01:00:06,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +18: [2023-05-13 01:00:06,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +18: [2023-05-13 01:00:06,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +18: [2023-05-13 01:00:06,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +20: [2023-05-13 01:00:06,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +18: [2023-05-13 01:00:06,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +18: [2023-05-13 01:00:06,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +12: [2023-05-13 01:00:06,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +12: [2023-05-13 01:00:06,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +18: [2023-05-13 01:00:06,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +11: [2023-05-13 01:00:06,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +11: [2023-05-13 01:00:06,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +12: [2023-05-13 01:00:06,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +12: [2023-05-13 01:00:06,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +18: [2023-05-13 01:00:06,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +12: [2023-05-13 01:00:06,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +12: [2023-05-13 01:00:06,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +12: [2023-05-13 01:00:06,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:06,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +18: [2023-05-13 01:00:06,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +18: [2023-05-13 01:00:06,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +18: [2023-05-13 01:00:06,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +18: [2023-05-13 01:00:06,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +18: [2023-05-13 01:00:06,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:06,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:06,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:06,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +20: [2023-05-13 01:00:06,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:06,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:06,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +20: [2023-05-13 01:00:06,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +24: [2023-05-13 01:00:06,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +30: [2023-05-13 01:00:06,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +30: [2023-05-13 01:00:06,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +30: [2023-05-13 01:00:06,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +30: [2023-05-13 01:00:06,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +30: [2023-05-13 01:00:06,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +30: [2023-05-13 01:00:06,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +30: [2023-05-13 01:00:06,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +30: [2023-05-13 01:00:06,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +30: [2023-05-13 01:00:06,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +30: [2023-05-13 01:00:06,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +30: [2023-05-13 01:00:06,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +30: [2023-05-13 01:00:06,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +30: [2023-05-13 01:00:06,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +30: [2023-05-13 01:00:06,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +26: [2023-05-13 01:00:06,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +30: [2023-05-13 01:00:06,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +29: [2023-05-13 01:00:06,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +29: [2023-05-13 01:00:06,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +26: [2023-05-13 01:00:06,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +29: [2023-05-13 01:00:06,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +29: [2023-05-13 01:00:06,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +29: [2023-05-13 01:00:06,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +30: [2023-05-13 01:00:06,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +29: [2023-05-13 01:00:06,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +29: [2023-05-13 01:00:06,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +29: [2023-05-13 01:00:06,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +23: [2023-05-13 01:00:06,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +23: [2023-05-13 01:00:06,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +14: [2023-05-13 01:00:06,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +14: [2023-05-13 01:00:06,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +14: [2023-05-13 01:00:06,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +14: [2023-05-13 01:00:06,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +14: [2023-05-13 01:00:06,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +14: [2023-05-13 01:00:06,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +14: [2023-05-13 01:00:06,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +14: [2023-05-13 01:00:06,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +29: [2023-05-13 01:00:06,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +12: [2023-05-13 01:00:06,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +29: [2023-05-13 01:00:06,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +23: [2023-05-13 01:00:06,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +29: [2023-05-13 01:00:06,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +29: [2023-05-13 01:00:06,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +29: [2023-05-13 01:00:06,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +29: [2023-05-13 01:00:06,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +23: [2023-05-13 01:00:06,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +23: [2023-05-13 01:00:06,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +23: [2023-05-13 01:00:06,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +23: [2023-05-13 01:00:06,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +23: [2023-05-13 01:00:06,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +29: [2023-05-13 01:00:06,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +23: [2023-05-13 01:00:06,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +14: [2023-05-13 01:00:06,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +14: [2023-05-13 01:00:06,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +23: [2023-05-13 01:00:06,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +14: [2023-05-13 01:00:06,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +29: [2023-05-13 01:00:06,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +14: [2023-05-13 01:00:06,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +14: [2023-05-13 01:00:06,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +14: [2023-05-13 01:00:06,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +14: [2023-05-13 01:00:06,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +14: [2023-05-13 01:00:06,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +23: [2023-05-13 01:00:06,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +13: [2023-05-13 01:00:06,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +13: [2023-05-13 01:00:06,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +23: [2023-05-13 01:00:06,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +23: [2023-05-13 01:00:06,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +23: [2023-05-13 01:00:06,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +23: [2023-05-13 01:00:06,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +16: [2023-05-13 01:00:06,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +23: [2023-05-13 01:00:06,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +16: [2023-05-13 01:00:06,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:06,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:06,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:06,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:06,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:06,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:06,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +20: [2023-05-13 01:00:06,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +26: [2023-05-13 01:00:06,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +13: [2023-05-13 01:00:06,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +13: [2023-05-13 01:00:06,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +18: [2023-05-13 01:00:06,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +18: [2023-05-13 01:00:06,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +13: [2023-05-13 01:00:06,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +18: [2023-05-13 01:00:06,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +13: [2023-05-13 01:00:06,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +13: [2023-05-13 01:00:06,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +13: [2023-05-13 01:00:06,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +13: [2023-05-13 01:00:06,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +13: [2023-05-13 01:00:06,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +16: [2023-05-13 01:00:06,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +13: [2023-05-13 01:00:06,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +16: [2023-05-13 01:00:06,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +16: [2023-05-13 01:00:06,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +16: [2023-05-13 01:00:06,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +16: [2023-05-13 01:00:06,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +16: [2023-05-13 01:00:06,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +16: [2023-05-13 01:00:06,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +16: [2023-05-13 01:00:06,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:06,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +13: [2023-05-13 01:00:06,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +13: [2023-05-13 01:00:06,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +13: [2023-05-13 01:00:06,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +13: [2023-05-13 01:00:06,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... +26: [2023-05-13 01:00:06,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +13: [2023-05-13 01:00:06,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +12: [2023-05-13 01:00:06,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:06,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +26: [2023-05-13 01:00:06,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +26: [2023-05-13 01:00:06,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +26: [2023-05-13 01:00:06,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +26: [2023-05-13 01:00:06,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +18: [2023-05-13 01:00:06,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +18: [2023-05-13 01:00:06,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +12: [2023-05-13 01:00:06,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +12: [2023-05-13 01:00:06,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +18: [2023-05-13 01:00:06,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +18: [2023-05-13 01:00:06,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +18: [2023-05-13 01:00:06,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +30: [2023-05-13 01:00:06,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +30: [2023-05-13 01:00:06,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +26: [2023-05-13 01:00:06,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +18: [2023-05-13 01:00:06,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +18: [2023-05-13 01:00:06,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +12: [2023-05-13 01:00:06,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +12: [2023-05-13 01:00:06,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +12: [2023-05-13 01:00:06,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +12: [2023-05-13 01:00:06,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +12: [2023-05-13 01:00:06,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +20: [2023-05-13 01:00:06,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +20: [2023-05-13 01:00:06,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +20: [2023-05-13 01:00:06,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +20: [2023-05-13 01:00:06,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +23: [2023-05-13 01:00:06,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +23: [2023-05-13 01:00:06,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +20: [2023-05-13 01:00:06,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +20: [2023-05-13 01:00:06,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +20: [2023-05-13 01:00:06,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +20: [2023-05-13 01:00:06,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +12: [2023-05-13 01:00:06,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +12: [2023-05-13 01:00:06,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +30: [2023-05-13 01:00:06,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +18: [2023-05-13 01:00:06,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +29: [2023-05-13 01:00:06,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +30: [2023-05-13 01:00:06,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:06,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +26: [2023-05-13 01:00:06,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +14: [2023-05-13 01:00:06,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +14: [2023-05-13 01:00:06,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +26: [2023-05-13 01:00:06,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +17: [2023-05-13 01:00:06,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +14: [2023-05-13 01:00:06,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +16: [2023-05-13 01:00:06,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +26: [2023-05-13 01:00:06,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +26: [2023-05-13 01:00:06,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +29: [2023-05-13 01:00:06,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +29: [2023-05-13 01:00:06,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +29: [2023-05-13 01:00:06,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +17: [2023-05-13 01:00:06,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +17: [2023-05-13 01:00:06,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +29: [2023-05-13 01:00:06,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +29: [2023-05-13 01:00:06,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +18: [2023-05-13 01:00:06,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +30: [2023-05-13 01:00:06,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +17: [2023-05-13 01:00:06,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +17: [2023-05-13 01:00:06,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +17: [2023-05-13 01:00:06,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +17: [2023-05-13 01:00:06,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +30: [2023-05-13 01:00:06,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +30: [2023-05-13 01:00:06,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +18: [2023-05-13 01:00:06,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +29: [2023-05-13 01:00:06,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +17: [2023-05-13 01:00:06,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +14: [2023-05-13 01:00:06,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +14: [2023-05-13 01:00:06,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +14: [2023-05-13 01:00:06,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +14: [2023-05-13 01:00:06,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +30: [2023-05-13 01:00:06,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +30: [2023-05-13 01:00:06,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +17: [2023-05-13 01:00:06,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +17: [2023-05-13 01:00:06,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +13: [2023-05-13 01:00:06,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +13: [2023-05-13 01:00:06,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +17: [2023-05-13 01:00:06,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +17: [2023-05-13 01:00:06,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +17: [2023-05-13 01:00:06,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +29: [2023-05-13 01:00:06,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +17: [2023-05-13 01:00:06,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +17: [2023-05-13 01:00:06,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +17: [2023-05-13 01:00:06,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +23: [2023-05-13 01:00:06,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +14: [2023-05-13 01:00:06,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +13: [2023-05-13 01:00:06,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +23: [2023-05-13 01:00:06,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +23: [2023-05-13 01:00:06,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +31: [2023-05-13 01:00:06,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +31: [2023-05-13 01:00:06,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +12: [2023-05-13 01:00:06,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +31: [2023-05-13 01:00:06,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +31: [2023-05-13 01:00:06,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +31: [2023-05-13 01:00:06,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +31: [2023-05-13 01:00:06,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +31: [2023-05-13 01:00:06,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +31: [2023-05-13 01:00:06,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:06,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +12: [2023-05-13 01:00:06,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +12: [2023-05-13 01:00:06,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +31: [2023-05-13 01:00:06,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +31: [2023-05-13 01:00:06,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +14: [2023-05-13 01:00:06,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +12: [2023-05-13 01:00:06,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +31: [2023-05-13 01:00:06,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +12: [2023-05-13 01:00:06,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +31: [2023-05-13 01:00:06,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +13: [2023-05-13 01:00:06,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +13: [2023-05-13 01:00:06,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +31: [2023-05-13 01:00:06,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +14: [2023-05-13 01:00:06,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +31: [2023-05-13 01:00:06,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +30: [2023-05-13 01:00:06,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +30: [2023-05-13 01:00:06,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +29: [2023-05-13 01:00:06,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +20: [2023-05-13 01:00:06,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +30: [2023-05-13 01:00:06,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +31: [2023-05-13 01:00:06,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +13: [2023-05-13 01:00:06,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +13: [2023-05-13 01:00:06,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +31: [2023-05-13 01:00:06,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +13: [2023-05-13 01:00:06,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +13: [2023-05-13 01:00:06,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +13: [2023-05-13 01:00:06,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +14: [2023-05-13 01:00:06,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +30: [2023-05-13 01:00:06,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +20: [2023-05-13 01:00:06,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +23: [2023-05-13 01:00:06,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +23: [2023-05-13 01:00:06,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +23: [2023-05-13 01:00:06,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +23: [2023-05-13 01:00:06,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. +23: [2023-05-13 01:00:06,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +14: [2023-05-13 01:00:06,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +20: [2023-05-13 01:00:06,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +20: [2023-05-13 01:00:06,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +14: [2023-05-13 01:00:06,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +14: [2023-05-13 01:00:06,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +30: [2023-05-13 01:00:06,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +20: [2023-05-13 01:00:06,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +29: [2023-05-13 01:00:06,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +20: [2023-05-13 01:00:06,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +14: [2023-05-13 01:00:06,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +20: [2023-05-13 01:00:06,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +30: [2023-05-13 01:00:06,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +29: [2023-05-13 01:00:06,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +29: [2023-05-13 01:00:06,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +29: [2023-05-13 01:00:06,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +23: [2023-05-13 01:00:06,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +13: [2023-05-13 01:00:06,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +29: [2023-05-13 01:00:06,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +29: [2023-05-13 01:00:06,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +29: [2023-05-13 01:00:06,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +14: [2023-05-13 01:00:06,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +16: [2023-05-13 01:00:06,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:06,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:06,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:06,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:06,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:06,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:06,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +10: [2023-05-13 01:00:06,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +10: [2023-05-13 01:00:06,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +10: [2023-05-13 01:00:06,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +10: [2023-05-13 01:00:06,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +10: [2023-05-13 01:00:06,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +10: [2023-05-13 01:00:06,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +10: [2023-05-13 01:00:06,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +10: [2023-05-13 01:00:06,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_06-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +10: [2023-05-13 01:00:06,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +10: [2023-05-13 01:00:06,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +10: [2023-05-13 01:00:06,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +10: [2023-05-13 01:00:06,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +10: [2023-05-13 01:00:06,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +10: [2023-05-13 01:00:06,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +10: [2023-05-13 01:00:06,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +10: [2023-05-13 01:00:06,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +30: [2023-05-13 01:00:06,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +13: [2023-05-13 01:00:06,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +13: [2023-05-13 01:00:06,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +13: [2023-05-13 01:00:06,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +17: [2023-05-13 01:00:06,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +17: [2023-05-13 01:00:06,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +13: [2023-05-13 01:00:06,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +13: [2023-05-13 01:00:06,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +23: [2023-05-13 01:00:06,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +23: [2023-05-13 01:00:06,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +23: [2023-05-13 01:00:06,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:06,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +19: [2023-05-13 01:00:06,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +17: [2023-05-13 01:00:06,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +19: [2023-05-13 01:00:06,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +19: [2023-05-13 01:00:06,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +19: [2023-05-13 01:00:06,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +19: [2023-05-13 01:00:06,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +19: [2023-05-13 01:00:06,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +19: [2023-05-13 01:00:06,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:06,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +16: [2023-05-13 01:00:06,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +17: [2023-05-13 01:00:06,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +19: [2023-05-13 01:00:06,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +17: [2023-05-13 01:00:06,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +16: [2023-05-13 01:00:06,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +16: [2023-05-13 01:00:06,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +16: [2023-05-13 01:00:06,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +16: [2023-05-13 01:00:06,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +19: [2023-05-13 01:00:06,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +31: [2023-05-13 01:00:06,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +31: [2023-05-13 01:00:06,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:06,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +25: [2023-05-13 01:00:06,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +25: [2023-05-13 01:00:06,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +19: [2023-05-13 01:00:06,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +31: [2023-05-13 01:00:06,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +31: [2023-05-13 01:00:06,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +31: [2023-05-13 01:00:06,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +31: [2023-05-13 01:00:06,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +31: [2023-05-13 01:00:06,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +31: [2023-05-13 01:00:06,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +19: [2023-05-13 01:00:06,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:06,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +25: [2023-05-13 01:00:06,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +25: [2023-05-13 01:00:06,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +25: [2023-05-13 01:00:06,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +19: [2023-05-13 01:00:06,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:06,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +25: [2023-05-13 01:00:06,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +19: [2023-05-13 01:00:06,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +19: [2023-05-13 01:00:06,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +19: [2023-05-13 01:00:06,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +19: [2023-05-13 01:00:06,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +17: [2023-05-13 01:00:06,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +17: [2023-05-13 01:00:06,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +17: [2023-05-13 01:00:06,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +17: [2023-05-13 01:00:06,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +25: [2023-05-13 01:00:06,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +25: [2023-05-13 01:00:06,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +25: [2023-05-13 01:00:06,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:06,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:06,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:06,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:06,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +17: [2023-05-13 01:00:06,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +17: [2023-05-13 01:00:06,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +10: [2023-05-13 01:00:06,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +10: [2023-05-13 01:00:06,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +10: [2023-05-13 01:00:06,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +10: [2023-05-13 01:00:06,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +10: [2023-05-13 01:00:06,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +31: [2023-05-13 01:00:06,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +10: [2023-05-13 01:00:06,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +31: [2023-05-13 01:00:06,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +17: [2023-05-13 01:00:06,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +17: [2023-05-13 01:00:06,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +17: [2023-05-13 01:00:06,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +17: [2023-05-13 01:00:06,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +19: [2023-05-13 01:00:06,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +17: [2023-05-13 01:00:06,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +10: [2023-05-13 01:00:06,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +25: [2023-05-13 01:00:06,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +10: [2023-05-13 01:00:06,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +10: [2023-05-13 01:00:06,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +28: [2023-05-13 01:00:06,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +28: [2023-05-13 01:00:06,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +28: [2023-05-13 01:00:06,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +28: [2023-05-13 01:00:06,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +28: [2023-05-13 01:00:06,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +28: [2023-05-13 01:00:06,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +28: [2023-05-13 01:00:06,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +10: [2023-05-13 01:00:06,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +28: [2023-05-13 01:00:06,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +28: [2023-05-13 01:00:06,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +28: [2023-05-13 01:00:06,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +28: [2023-05-13 01:00:06,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +28: [2023-05-13 01:00:06,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +28: [2023-05-13 01:00:06,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +28: [2023-05-13 01:00:06,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:06,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +25: [2023-05-13 01:00:06,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +19: [2023-05-13 01:00:06,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +25: [2023-05-13 01:00:06,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +19: [2023-05-13 01:00:06,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +19: [2023-05-13 01:00:06,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +19: [2023-05-13 01:00:06,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +19: [2023-05-13 01:00:06,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +19: [2023-05-13 01:00:06,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +19: [2023-05-13 01:00:06,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +19: [2023-05-13 01:00:06,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +15: [2023-05-13 01:00:06,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +15: [2023-05-13 01:00:06,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +15: [2023-05-13 01:00:06,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +15: [2023-05-13 01:00:06,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +15: [2023-05-13 01:00:06,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +15: [2023-05-13 01:00:06,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +15: [2023-05-13 01:00:06,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +15: [2023-05-13 01:00:06,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +25: [2023-05-13 01:00:06,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +25: [2023-05-13 01:00:06,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +25: [2023-05-13 01:00:06,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +25: [2023-05-13 01:00:06,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +25: [2023-05-13 01:00:06,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +25: [2023-05-13 01:00:06,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +15: [2023-05-13 01:00:06,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +15: [2023-05-13 01:00:06,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +25: [2023-05-13 01:00:06,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +15: [2023-05-13 01:00:06,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +15: [2023-05-13 01:00:06,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +15: [2023-05-13 01:00:06,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +15: [2023-05-13 01:00:06,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:06,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +21: [2023-05-13 01:00:06,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +15: [2023-05-13 01:00:06,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +15: [2023-05-13 01:00:06,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:06,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +21: [2023-05-13 01:00:06,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +21: [2023-05-13 01:00:06,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +21: [2023-05-13 01:00:06,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +21: [2023-05-13 01:00:06,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +21: [2023-05-13 01:00:06,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +21: [2023-05-13 01:00:06,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +21: [2023-05-13 01:00:06,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +21: [2023-05-13 01:00:06,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +21: [2023-05-13 01:00:06,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +21: [2023-05-13 01:00:06,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +21: [2023-05-13 01:00:06,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +21: [2023-05-13 01:00:06,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +21: [2023-05-13 01:00:06,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +19: [2023-05-13 01:00:06,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +19: [2023-05-13 01:00:06,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +19: [2023-05-13 01:00:06,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +25: [2023-05-13 01:00:06,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +19: [2023-05-13 01:00:06,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +25: [2023-05-13 01:00:06,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +19: [2023-05-13 01:00:06,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +19: [2023-05-13 01:00:06,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +19: [2023-05-13 01:00:06,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +25: [2023-05-13 01:00:06,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +28: [2023-05-13 01:00:06,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +28: [2023-05-13 01:00:06,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +28: [2023-05-13 01:00:06,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +25: [2023-05-13 01:00:06,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +25: [2023-05-13 01:00:06,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +28: [2023-05-13 01:00:06,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +15: [2023-05-13 01:00:06,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +22: [2023-05-13 01:00:06,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +22: [2023-05-13 01:00:06,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +22: [2023-05-13 01:00:06,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +22: [2023-05-13 01:00:06,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +22: [2023-05-13 01:00:06,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +22: [2023-05-13 01:00:06,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +22: [2023-05-13 01:00:06,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +22: [2023-05-13 01:00:06,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +22: [2023-05-13 01:00:06,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +22: [2023-05-13 01:00:06,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +22: [2023-05-13 01:00:06,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +22: [2023-05-13 01:00:06,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +22: [2023-05-13 01:00:06,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +22: [2023-05-13 01:00:06,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +22: [2023-05-13 01:00:06,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +22: [2023-05-13 01:00:06,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +15: [2023-05-13 01:00:06,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +21: [2023-05-13 01:00:06,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +21: [2023-05-13 01:00:06,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +28: [2023-05-13 01:00:06,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +21: [2023-05-13 01:00:06,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +21: [2023-05-13 01:00:06,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +15: [2023-05-13 01:00:06,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +28: [2023-05-13 01:00:06,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +15: [2023-05-13 01:00:06,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +21: [2023-05-13 01:00:06,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +15: [2023-05-13 01:00:06,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +15: [2023-05-13 01:00:06,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +15: [2023-05-13 01:00:06,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +15: [2023-05-13 01:00:06,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +15: [2023-05-13 01:00:06,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +21: [2023-05-13 01:00:06,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +21: [2023-05-13 01:00:06,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +24: [2023-05-13 01:00:06,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +24: [2023-05-13 01:00:06,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +24: [2023-05-13 01:00:06,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +24: [2023-05-13 01:00:06,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +24: [2023-05-13 01:00:06,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +24: [2023-05-13 01:00:06,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +24: [2023-05-13 01:00:06,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +24: [2023-05-13 01:00:06,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +24: [2023-05-13 01:00:06,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +21: [2023-05-13 01:00:06,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +24: [2023-05-13 01:00:06,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +15: [2023-05-13 01:00:06,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +21: [2023-05-13 01:00:06,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +21: [2023-05-13 01:00:06,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +21: [2023-05-13 01:00:06,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +15: [2023-05-13 01:00:06,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +21: [2023-05-13 01:00:06,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +21: [2023-05-13 01:00:06,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +15: [2023-05-13 01:00:06,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +21: [2023-05-13 01:00:06,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +21: [2023-05-13 01:00:06,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +15: [2023-05-13 01:00:06,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +15: [2023-05-13 01:00:06,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +15: [2023-05-13 01:00:06,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +15: [2023-05-13 01:00:06,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +21: [2023-05-13 01:00:06,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +22: [2023-05-13 01:00:06,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +22: [2023-05-13 01:00:06,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +22: [2023-05-13 01:00:06,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +22: [2023-05-13 01:00:06,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +22: [2023-05-13 01:00:06,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +22: [2023-05-13 01:00:06,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +22: [2023-05-13 01:00:06,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +22: [2023-05-13 01:00:06,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +22: [2023-05-13 01:00:06,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +22: [2023-05-13 01:00:06,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +24: [2023-05-13 01:00:06,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +22: [2023-05-13 01:00:06,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +24: [2023-05-13 01:00:06,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +22: [2023-05-13 01:00:06,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +27: [2023-05-13 01:00:06,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +27: [2023-05-13 01:00:06,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +27: [2023-05-13 01:00:06,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +27: [2023-05-13 01:00:06,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +27: [2023-05-13 01:00:06,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +27: [2023-05-13 01:00:06,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +12: [2023-05-13 01:00:06,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +12: [2023-05-13 01:00:06,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +12: [2023-05-13 01:00:06,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +12: [2023-05-13 01:00:06,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +12: [2023-05-13 01:00:06,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +12: [2023-05-13 01:00:06,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +12: [2023-05-13 01:00:06,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +27: [2023-05-13 01:00:06,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +12: [2023-05-13 01:00:06,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +22: [2023-05-13 01:00:06,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +12: [2023-05-13 01:00:06,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +24: [2023-05-13 01:00:06,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +22: [2023-05-13 01:00:06,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +22: [2023-05-13 01:00:06,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +22: [2023-05-13 01:00:06,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +12: [2023-05-13 01:00:06,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +12: [2023-05-13 01:00:06,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +12: [2023-05-13 01:00:06,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +12: [2023-05-13 01:00:06,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +12: [2023-05-13 01:00:06,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +24: [2023-05-13 01:00:06,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +24: [2023-05-13 01:00:06,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +12: [2023-05-13 01:00:06,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +12: [2023-05-13 01:00:06,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +24: [2023-05-13 01:00:06,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +11: [2023-05-13 01:00:06,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +11: [2023-05-13 01:00:06,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +11: [2023-05-13 01:00:06,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +11: [2023-05-13 01:00:06,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +11: [2023-05-13 01:00:06,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +11: [2023-05-13 01:00:06,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +11: [2023-05-13 01:00:06,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +11: [2023-05-13 01:00:06,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +11: [2023-05-13 01:00:06,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +11: [2023-05-13 01:00:06,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +11: [2023-05-13 01:00:06,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +11: [2023-05-13 01:00:06,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +11: [2023-05-13 01:00:06,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +29: [2023-05-13 01:00:06,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +29: [2023-05-13 01:00:06,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +29: [2023-05-13 01:00:06,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +29: [2023-05-13 01:00:06,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +29: [2023-05-13 01:00:06,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +29: [2023-05-13 01:00:06,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +29: [2023-05-13 01:00:06,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +29: [2023-05-13 01:00:06,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +14: [2023-05-13 01:00:06,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +14: [2023-05-13 01:00:06,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +14: [2023-05-13 01:00:06,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +14: [2023-05-13 01:00:06,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +14: [2023-05-13 01:00:06,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +14: [2023-05-13 01:00:06,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +14: [2023-05-13 01:00:06,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +14: [2023-05-13 01:00:06,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +26: [2023-05-13 01:00:06,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +26: [2023-05-13 01:00:06,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +26: [2023-05-13 01:00:06,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +24: [2023-05-13 01:00:06,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +26: [2023-05-13 01:00:06,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +26: [2023-05-13 01:00:06,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +26: [2023-05-13 01:00:06,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +26: [2023-05-13 01:00:06,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +26: [2023-05-13 01:00:06,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +29: [2023-05-13 01:00:06,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +29: [2023-05-13 01:00:06,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +29: [2023-05-13 01:00:06,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +14: [2023-05-13 01:00:06,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +29: [2023-05-13 01:00:06,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +29: [2023-05-13 01:00:06,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +14: [2023-05-13 01:00:06,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +29: [2023-05-13 01:00:06,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +14: [2023-05-13 01:00:06,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +29: [2023-05-13 01:00:06,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +14: [2023-05-13 01:00:06,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +29: [2023-05-13 01:00:06,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +14: [2023-05-13 01:00:06,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +14: [2023-05-13 01:00:06,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +24: [2023-05-13 01:00:06,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +24: [2023-05-13 01:00:06,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +26: [2023-05-13 01:00:06,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +14: [2023-05-13 01:00:06,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +14: [2023-05-13 01:00:06,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +26: [2023-05-13 01:00:06,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +26: [2023-05-13 01:00:06,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +26: [2023-05-13 01:00:06,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +26: [2023-05-13 01:00:06,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +26: [2023-05-13 01:00:06,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +26: [2023-05-13 01:00:06,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +26: [2023-05-13 01:00:06,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +27: [2023-05-13 01:00:06,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +13: [2023-05-13 01:00:06,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +13: [2023-05-13 01:00:06,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +13: [2023-05-13 01:00:06,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +13: [2023-05-13 01:00:06,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +13: [2023-05-13 01:00:06,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +13: [2023-05-13 01:00:06,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +13: [2023-05-13 01:00:06,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +13: [2023-05-13 01:00:06,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +12: [2023-05-13 01:00:06,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +13: [2023-05-13 01:00:06,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +13: [2023-05-13 01:00:06,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +13: [2023-05-13 01:00:06,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +13: [2023-05-13 01:00:06,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +13: [2023-05-13 01:00:06,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +27: [2023-05-13 01:00:06,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +13: [2023-05-13 01:00:06,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +13: [2023-05-13 01:00:06,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +13: [2023-05-13 01:00:06,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +27: [2023-05-13 01:00:06,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +18: [2023-05-13 01:00:06,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +18: [2023-05-13 01:00:06,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +18: [2023-05-13 01:00:06,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +18: [2023-05-13 01:00:06,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +18: [2023-05-13 01:00:06,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +18: [2023-05-13 01:00:06,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +18: [2023-05-13 01:00:06,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +18: [2023-05-13 01:00:06,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +18: [2023-05-13 01:00:06,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +12: [2023-05-13 01:00:06,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +18: [2023-05-13 01:00:06,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +18: [2023-05-13 01:00:06,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +18: [2023-05-13 01:00:06,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +18: [2023-05-13 01:00:06,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +18: [2023-05-13 01:00:06,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +12: [2023-05-13 01:00:06,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +12: [2023-05-13 01:00:06,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +27: [2023-05-13 01:00:06,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +27: [2023-05-13 01:00:06,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +11: [2023-05-13 01:00:06,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +11: [2023-05-13 01:00:06,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +27: [2023-05-13 01:00:06,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +12: [2023-05-13 01:00:06,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +12: [2023-05-13 01:00:06,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +12: [2023-05-13 01:00:06,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +12: [2023-05-13 01:00:06,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +12: [2023-05-13 01:00:06,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +27: [2023-05-13 01:00:06,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +26: [2023-05-13 01:00:06,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +26: [2023-05-13 01:00:06,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +29: [2023-05-13 01:00:06,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +14: [2023-05-13 01:00:06,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +14: [2023-05-13 01:00:06,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +11: [2023-05-13 01:00:06,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +11: [2023-05-13 01:00:06,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +11: [2023-05-13 01:00:06,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +11: [2023-05-13 01:00:06,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +29: [2023-05-13 01:00:06,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +29: [2023-05-13 01:00:06,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +14: [2023-05-13 01:00:06,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +14: [2023-05-13 01:00:06,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +14: [2023-05-13 01:00:06,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:06,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +29: [2023-05-13 01:00:06,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +14: [2023-05-13 01:00:06,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +12: [2023-05-13 01:00:06,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +12: [2023-05-13 01:00:06,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +29: [2023-05-13 01:00:06,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:06,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +13: [2023-05-13 01:00:06,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +13: [2023-05-13 01:00:06,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +30: [2023-05-13 01:00:06,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +11: [2023-05-13 01:00:06,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +11: [2023-05-13 01:00:06,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +13: [2023-05-13 01:00:06,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +30: [2023-05-13 01:00:06,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +11: [2023-05-13 01:00:06,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +30: [2023-05-13 01:00:06,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +30: [2023-05-13 01:00:06,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +30: [2023-05-13 01:00:06,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +30: [2023-05-13 01:00:06,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +30: [2023-05-13 01:00:06,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +30: [2023-05-13 01:00:06,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +30: [2023-05-13 01:00:06,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +16: [2023-05-13 01:00:06,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +16: [2023-05-13 01:00:06,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +16: [2023-05-13 01:00:06,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +16: [2023-05-13 01:00:06,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +26: [2023-05-13 01:00:06,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +30: [2023-05-13 01:00:06,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +16: [2023-05-13 01:00:06,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +14: [2023-05-13 01:00:06,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +29: [2023-05-13 01:00:06,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +14: [2023-05-13 01:00:06,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +13: [2023-05-13 01:00:06,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +13: [2023-05-13 01:00:06,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +30: [2023-05-13 01:00:06,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +30: [2023-05-13 01:00:06,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +29: [2023-05-13 01:00:06,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +30: [2023-05-13 01:00:06,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +13: [2023-05-13 01:00:06,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +13: [2023-05-13 01:00:06,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +13: [2023-05-13 01:00:06,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +30: [2023-05-13 01:00:06,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +30: [2023-05-13 01:00:06,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +30: [2023-05-13 01:00:06,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +18: [2023-05-13 01:00:06,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +26: [2023-05-13 01:00:06,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +29: [2023-05-13 01:00:06,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +12: [2023-05-13 01:00:06,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +12: [2023-05-13 01:00:06,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +26: [2023-05-13 01:00:06,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +26: [2023-05-13 01:00:06,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +26: [2023-05-13 01:00:06,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +26: [2023-05-13 01:00:06,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +26: [2023-05-13 01:00:06,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +12: [2023-05-13 01:00:06,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +29: [2023-05-13 01:00:06,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +14: [2023-05-13 01:00:06,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +12: [2023-05-13 01:00:06,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +14: [2023-05-13 01:00:06,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +12: [2023-05-13 01:00:06,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +29: [2023-05-13 01:00:06,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +29: [2023-05-13 01:00:06,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +23: [2023-05-13 01:00:06,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +11: [2023-05-13 01:00:06,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +23: [2023-05-13 01:00:06,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +23: [2023-05-13 01:00:06,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +23: [2023-05-13 01:00:06,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +23: [2023-05-13 01:00:06,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +23: [2023-05-13 01:00:06,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +23: [2023-05-13 01:00:06,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +23: [2023-05-13 01:00:06,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +14: [2023-05-13 01:00:06,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +14: [2023-05-13 01:00:06,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +13: [2023-05-13 01:00:06,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +29: [2023-05-13 01:00:06,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +26: [2023-05-13 01:00:06,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +29: [2023-05-13 01:00:06,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +20: [2023-05-13 01:00:06,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +20: [2023-05-13 01:00:06,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +20: [2023-05-13 01:00:06,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +20: [2023-05-13 01:00:06,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +20: [2023-05-13 01:00:06,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +20: [2023-05-13 01:00:06,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +20: [2023-05-13 01:00:06,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +20: [2023-05-13 01:00:06,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +17: [2023-05-13 01:00:06,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +17: [2023-05-13 01:00:06,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +17: [2023-05-13 01:00:06,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +17: [2023-05-13 01:00:06,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +17: [2023-05-13 01:00:06,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +17: [2023-05-13 01:00:06,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +17: [2023-05-13 01:00:06,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +17: [2023-05-13 01:00:06,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +14: [2023-05-13 01:00:06,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +14: [2023-05-13 01:00:06,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +23: [2023-05-13 01:00:06,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +23: [2023-05-13 01:00:06,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +23: [2023-05-13 01:00:06,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +14: [2023-05-13 01:00:06,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +20: [2023-05-13 01:00:06,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +17: [2023-05-13 01:00:06,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +17: [2023-05-13 01:00:06,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +13: [2023-05-13 01:00:06,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +13: [2023-05-13 01:00:06,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +23: [2023-05-13 01:00:06,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +18: [2023-05-13 01:00:06,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +18: [2023-05-13 01:00:06,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +18: [2023-05-13 01:00:06,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +17: [2023-05-13 01:00:06,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +14: [2023-05-13 01:00:06,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +17: [2023-05-13 01:00:06,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +17: [2023-05-13 01:00:06,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +17: [2023-05-13 01:00:06,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +17: [2023-05-13 01:00:06,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +17: [2023-05-13 01:00:06,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +13: [2023-05-13 01:00:06,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +20: [2023-05-13 01:00:06,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +20: [2023-05-13 01:00:06,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +20: [2023-05-13 01:00:06,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +20: [2023-05-13 01:00:06,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +10: [2023-05-13 01:00:06,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +10: [2023-05-13 01:00:06,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +10: [2023-05-13 01:00:06,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +10: [2023-05-13 01:00:06,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +10: [2023-05-13 01:00:06,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +10: [2023-05-13 01:00:06,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +10: [2023-05-13 01:00:06,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +20: [2023-05-13 01:00:06,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +29: [2023-05-13 01:00:06,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +20: [2023-05-13 01:00:06,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +13: [2023-05-13 01:00:06,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +29: [2023-05-13 01:00:06,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +20: [2023-05-13 01:00:06,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt... +13: [2023-05-13 01:00:06,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +13: [2023-05-13 01:00:06,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +26: [2023-05-13 01:00:06,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +13: [2023-05-13 01:00:06,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +16: [2023-05-13 01:00:06,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +18: [2023-05-13 01:00:06,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +29: [2023-05-13 01:00:06,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +26: [2023-05-13 01:00:06,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +26: [2023-05-13 01:00:06,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +26: [2023-05-13 01:00:06,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +26: [2023-05-13 01:00:06,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +30: [2023-05-13 01:00:06,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +18: [2023-05-13 01:00:06,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +30: [2023-05-13 01:00:06,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +18: [2023-05-13 01:00:06,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +16: [2023-05-13 01:00:06,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +18: [2023-05-13 01:00:06,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +26: [2023-05-13 01:00:06,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +30: [2023-05-13 01:00:06,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +23: [2023-05-13 01:00:06,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +23: [2023-05-13 01:00:06,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +30: [2023-05-13 01:00:06,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +30: [2023-05-13 01:00:06,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +30: [2023-05-13 01:00:06,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +17: [2023-05-13 01:00:06,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +17: [2023-05-13 01:00:06,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:06,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +16: [2023-05-13 01:00:06,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +20: [2023-05-13 01:00:06,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +30: [2023-05-13 01:00:06,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +30: [2023-05-13 01:00:06,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +30: [2023-05-13 01:00:06,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +30: [2023-05-13 01:00:06,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +30: [2023-05-13 01:00:06,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +10: [2023-05-13 01:00:06,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +23: [2023-05-13 01:00:06,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +10: [2023-05-13 01:00:06,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +10: [2023-05-13 01:00:06,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +17: [2023-05-13 01:00:06,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +17: [2023-05-13 01:00:06,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +10: [2023-05-13 01:00:06,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +10: [2023-05-13 01:00:06,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +10: [2023-05-13 01:00:06,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +10: [2023-05-13 01:00:06,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +23: [2023-05-13 01:00:06,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +23: [2023-05-13 01:00:06,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +23: [2023-05-13 01:00:06,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +23: [2023-05-13 01:00:06,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +17: [2023-05-13 01:00:06,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +17: [2023-05-13 01:00:06,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +17: [2023-05-13 01:00:06,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +17: [2023-05-13 01:00:06,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +23: [2023-05-13 01:00:06,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +30: [2023-05-13 01:00:06,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +17: [2023-05-13 01:00:06,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +30: [2023-05-13 01:00:06,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +20: [2023-05-13 01:00:06,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +25: [2023-05-13 01:00:06,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:06,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +30: [2023-05-13 01:00:06,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +25: [2023-05-13 01:00:06,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:06,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:06,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:06,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +30: [2023-05-13 01:00:06,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +25: [2023-05-13 01:00:06,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:06,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:06,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +25: [2023-05-13 01:00:06,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +20: [2023-05-13 01:00:06,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +20: [2023-05-13 01:00:06,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:06,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +20: [2023-05-13 01:00:06,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +20: [2023-05-13 01:00:06,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +20: [2023-05-13 01:00:06,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +20: [2023-05-13 01:00:06,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +16: [2023-05-13 01:00:06,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +30: [2023-05-13 01:00:06,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +16: [2023-05-13 01:00:06,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +25: [2023-05-13 01:00:06,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +25: [2023-05-13 01:00:06,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +25: [2023-05-13 01:00:06,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +25: [2023-05-13 01:00:06,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +25: [2023-05-13 01:00:06,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +20: [2023-05-13 01:00:06,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_07-model_00-model_states.pt. +25: [2023-05-13 01:00:06,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +16: [2023-05-13 01:00:06,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +17: [2023-05-13 01:00:06,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +10: [2023-05-13 01:00:06,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +10: [2023-05-13 01:00:06,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +10: [2023-05-13 01:00:06,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +10: [2023-05-13 01:00:06,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +23: [2023-05-13 01:00:06,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +17: [2023-05-13 01:00:06,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +17: [2023-05-13 01:00:06,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +17: [2023-05-13 01:00:06,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +17: [2023-05-13 01:00:06,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +17: [2023-05-13 01:00:06,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +20: [2023-05-13 01:00:06,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +20: [2023-05-13 01:00:06,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +17: [2023-05-13 01:00:06,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +20: [2023-05-13 01:00:06,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +20: [2023-05-13 01:00:06,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +20: [2023-05-13 01:00:06,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +20: [2023-05-13 01:00:06,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +20: [2023-05-13 01:00:06,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +25: [2023-05-13 01:00:06,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:06,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:06,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:06,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +25: [2023-05-13 01:00:06,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:06,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:06,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:06,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:06,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +25: [2023-05-13 01:00:06,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +25: [2023-05-13 01:00:06,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +19: [2023-05-13 01:00:06,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +19: [2023-05-13 01:00:06,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +19: [2023-05-13 01:00:06,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +19: [2023-05-13 01:00:06,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +19: [2023-05-13 01:00:06,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +19: [2023-05-13 01:00:06,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +19: [2023-05-13 01:00:06,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +19: [2023-05-13 01:00:06,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:06,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +19: [2023-05-13 01:00:06,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +25: [2023-05-13 01:00:06,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +25: [2023-05-13 01:00:06,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +19: [2023-05-13 01:00:06,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +19: [2023-05-13 01:00:06,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +19: [2023-05-13 01:00:06,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +25: [2023-05-13 01:00:06,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +25: [2023-05-13 01:00:06,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +19: [2023-05-13 01:00:06,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +19: [2023-05-13 01:00:06,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +19: [2023-05-13 01:00:06,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +19: [2023-05-13 01:00:06,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +21: [2023-05-13 01:00:06,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +21: [2023-05-13 01:00:06,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +21: [2023-05-13 01:00:06,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +21: [2023-05-13 01:00:06,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +21: [2023-05-13 01:00:06,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +21: [2023-05-13 01:00:06,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +21: [2023-05-13 01:00:06,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +21: [2023-05-13 01:00:06,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +21: [2023-05-13 01:00:06,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +21: [2023-05-13 01:00:06,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +21: [2023-05-13 01:00:06,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +21: [2023-05-13 01:00:06,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +21: [2023-05-13 01:00:06,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +21: [2023-05-13 01:00:06,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +21: [2023-05-13 01:00:06,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +21: [2023-05-13 01:00:06,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +15: [2023-05-13 01:00:06,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +15: [2023-05-13 01:00:06,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +15: [2023-05-13 01:00:06,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +15: [2023-05-13 01:00:06,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +15: [2023-05-13 01:00:06,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +15: [2023-05-13 01:00:06,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +15: [2023-05-13 01:00:06,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +15: [2023-05-13 01:00:06,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +15: [2023-05-13 01:00:06,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +15: [2023-05-13 01:00:06,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +15: [2023-05-13 01:00:06,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +15: [2023-05-13 01:00:06,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +15: [2023-05-13 01:00:06,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +15: [2023-05-13 01:00:06,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +15: [2023-05-13 01:00:06,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +15: [2023-05-13 01:00:06,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +28: [2023-05-13 01:00:06,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +28: [2023-05-13 01:00:06,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +28: [2023-05-13 01:00:06,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +28: [2023-05-13 01:00:06,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +28: [2023-05-13 01:00:06,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +28: [2023-05-13 01:00:06,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +28: [2023-05-13 01:00:06,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +28: [2023-05-13 01:00:06,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +19: [2023-05-13 01:00:06,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +22: [2023-05-13 01:00:06,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +22: [2023-05-13 01:00:06,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +22: [2023-05-13 01:00:06,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +22: [2023-05-13 01:00:06,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +22: [2023-05-13 01:00:06,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +22: [2023-05-13 01:00:06,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +22: [2023-05-13 01:00:06,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +22: [2023-05-13 01:00:06,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +22: [2023-05-13 01:00:06,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +22: [2023-05-13 01:00:06,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +22: [2023-05-13 01:00:06,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +22: [2023-05-13 01:00:06,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +22: [2023-05-13 01:00:06,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +22: [2023-05-13 01:00:06,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +22: [2023-05-13 01:00:06,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +22: [2023-05-13 01:00:06,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +31: [2023-05-13 01:00:06,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +31: [2023-05-13 01:00:06,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +31: [2023-05-13 01:00:06,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +31: [2023-05-13 01:00:06,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +31: [2023-05-13 01:00:06,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +31: [2023-05-13 01:00:06,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +31: [2023-05-13 01:00:06,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +31: [2023-05-13 01:00:06,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +19: [2023-05-13 01:00:06,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +19: [2023-05-13 01:00:06,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +31: [2023-05-13 01:00:06,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +31: [2023-05-13 01:00:06,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +21: [2023-05-13 01:00:06,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +21: [2023-05-13 01:00:06,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +21: [2023-05-13 01:00:06,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +21: [2023-05-13 01:00:06,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +21: [2023-05-13 01:00:06,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +21: [2023-05-13 01:00:06,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +21: [2023-05-13 01:00:06,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +19: [2023-05-13 01:00:06,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +15: [2023-05-13 01:00:06,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +12: [2023-05-13 01:00:06,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +12: [2023-05-13 01:00:06,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +12: [2023-05-13 01:00:06,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +12: [2023-05-13 01:00:06,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +12: [2023-05-13 01:00:06,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +12: [2023-05-13 01:00:06,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +12: [2023-05-13 01:00:06,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +12: [2023-05-13 01:00:06,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +19: [2023-05-13 01:00:06,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +12: [2023-05-13 01:00:06,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +21: [2023-05-13 01:00:06,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +19: [2023-05-13 01:00:06,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +19: [2023-05-13 01:00:06,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +19: [2023-05-13 01:00:06,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +19: [2023-05-13 01:00:06,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +19: [2023-05-13 01:00:06,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +15: [2023-05-13 01:00:06,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +12: [2023-05-13 01:00:06,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +15: [2023-05-13 01:00:06,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +12: [2023-05-13 01:00:06,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +12: [2023-05-13 01:00:06,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +12: [2023-05-13 01:00:06,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +12: [2023-05-13 01:00:06,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +12: [2023-05-13 01:00:06,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +12: [2023-05-13 01:00:06,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 7: [2023-05-13 01:00:06,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:06,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +15: [2023-05-13 01:00:06,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +15: [2023-05-13 01:00:06,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +15: [2023-05-13 01:00:06,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +15: [2023-05-13 01:00:06,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 7: [2023-05-13 01:00:06,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +28: [2023-05-13 01:00:06,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +28: [2023-05-13 01:00:06,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +28: [2023-05-13 01:00:06,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +28: [2023-05-13 01:00:06,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +28: [2023-05-13 01:00:06,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +21: [2023-05-13 01:00:06,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +28: [2023-05-13 01:00:06,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +28: [2023-05-13 01:00:06,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +28: [2023-05-13 01:00:06,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +21: [2023-05-13 01:00:06,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +21: [2023-05-13 01:00:06,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +22: [2023-05-13 01:00:06,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +22: [2023-05-13 01:00:06,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +21: [2023-05-13 01:00:06,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +21: [2023-05-13 01:00:06,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +21: [2023-05-13 01:00:06,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:06,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +21: [2023-05-13 01:00:06,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +19: [2023-05-13 01:00:06,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +19: [2023-05-13 01:00:06,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +21: [2023-05-13 01:00:06,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:06,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +22: [2023-05-13 01:00:06,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +22: [2023-05-13 01:00:06,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +22: [2023-05-13 01:00:06,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +22: [2023-05-13 01:00:06,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +22: [2023-05-13 01:00:06,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +22: [2023-05-13 01:00:06,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +19: [2023-05-13 01:00:06,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +19: [2023-05-13 01:00:06,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +11: [2023-05-13 01:00:06,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +11: [2023-05-13 01:00:06,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +19: [2023-05-13 01:00:06,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +15: [2023-05-13 01:00:06,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +11: [2023-05-13 01:00:06,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +11: [2023-05-13 01:00:06,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +11: [2023-05-13 01:00:06,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +11: [2023-05-13 01:00:06,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +19: [2023-05-13 01:00:06,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +11: [2023-05-13 01:00:06,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +11: [2023-05-13 01:00:06,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +27: [2023-05-13 01:00:06,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +27: [2023-05-13 01:00:06,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +27: [2023-05-13 01:00:06,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +27: [2023-05-13 01:00:06,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +27: [2023-05-13 01:00:06,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +27: [2023-05-13 01:00:06,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +27: [2023-05-13 01:00:06,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 9: [2023-05-13 01:00:06,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +31: [2023-05-13 01:00:06,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +27: [2023-05-13 01:00:06,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +31: [2023-05-13 01:00:06,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +31: [2023-05-13 01:00:06,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +22: [2023-05-13 01:00:06,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +22: [2023-05-13 01:00:06,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:06,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +31: [2023-05-13 01:00:06,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +27: [2023-05-13 01:00:06,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +27: [2023-05-13 01:00:06,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +27: [2023-05-13 01:00:06,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +27: [2023-05-13 01:00:06,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +15: [2023-05-13 01:00:06,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +27: [2023-05-13 01:00:06,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +27: [2023-05-13 01:00:06,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +28: [2023-05-13 01:00:06,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +28: [2023-05-13 01:00:06,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +11: [2023-05-13 01:00:06,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +15: [2023-05-13 01:00:06,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +27: [2023-05-13 01:00:06,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +27: [2023-05-13 01:00:06,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +15: [2023-05-13 01:00:06,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +15: [2023-05-13 01:00:06,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +28: [2023-05-13 01:00:06,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +12: [2023-05-13 01:00:06,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +16: [2023-05-13 01:00:06,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +16: [2023-05-13 01:00:06,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +16: [2023-05-13 01:00:06,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +16: [2023-05-13 01:00:06,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +28: [2023-05-13 01:00:06,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +28: [2023-05-13 01:00:06,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +28: [2023-05-13 01:00:06,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +28: [2023-05-13 01:00:06,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +28: [2023-05-13 01:00:06,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +22: [2023-05-13 01:00:06,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +31: [2023-05-13 01:00:06,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +22: [2023-05-13 01:00:06,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +22: [2023-05-13 01:00:06,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +22: [2023-05-13 01:00:06,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +31: [2023-05-13 01:00:06,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 9: [2023-05-13 01:00:06,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +22: [2023-05-13 01:00:06,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +22: [2023-05-13 01:00:06,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +12: [2023-05-13 01:00:06,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:06,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +12: [2023-05-13 01:00:06,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +12: [2023-05-13 01:00:06,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +17: [2023-05-13 01:00:06,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +17: [2023-05-13 01:00:06,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +17: [2023-05-13 01:00:06,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +17: [2023-05-13 01:00:06,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +17: [2023-05-13 01:00:06,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +17: [2023-05-13 01:00:06,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +17: [2023-05-13 01:00:06,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +17: [2023-05-13 01:00:06,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +17: [2023-05-13 01:00:06,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +17: [2023-05-13 01:00:06,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +17: [2023-05-13 01:00:06,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +17: [2023-05-13 01:00:06,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +17: [2023-05-13 01:00:06,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +17: [2023-05-13 01:00:06,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +17: [2023-05-13 01:00:06,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +17: [2023-05-13 01:00:06,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +11: [2023-05-13 01:00:06,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +11: [2023-05-13 01:00:06,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +12: [2023-05-13 01:00:06,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +12: [2023-05-13 01:00:06,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +12: [2023-05-13 01:00:06,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +12: [2023-05-13 01:00:06,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +11: [2023-05-13 01:00:06,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +27: [2023-05-13 01:00:06,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +12: [2023-05-13 01:00:06,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +27: [2023-05-13 01:00:06,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +27: [2023-05-13 01:00:06,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +27: [2023-05-13 01:00:06,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +12: [2023-05-13 01:00:06,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +27: [2023-05-13 01:00:06,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +27: [2023-05-13 01:00:06,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +27: [2023-05-13 01:00:06,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +27: [2023-05-13 01:00:06,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +16: [2023-05-13 01:00:06,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +16: [2023-05-13 01:00:06,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +16: [2023-05-13 01:00:06,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +16: [2023-05-13 01:00:06,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +16: [2023-05-13 01:00:06,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +16: [2023-05-13 01:00:06,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +16: [2023-05-13 01:00:06,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +16: [2023-05-13 01:00:06,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +16: [2023-05-13 01:00:06,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +16: [2023-05-13 01:00:06,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +16: [2023-05-13 01:00:06,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +29: [2023-05-13 01:00:06,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +29: [2023-05-13 01:00:06,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +29: [2023-05-13 01:00:06,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +29: [2023-05-13 01:00:06,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +29: [2023-05-13 01:00:06,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +29: [2023-05-13 01:00:06,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +29: [2023-05-13 01:00:06,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 8: [2023-05-13 01:00:06,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +29: [2023-05-13 01:00:06,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +29: [2023-05-13 01:00:06,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +29: [2023-05-13 01:00:06,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +14: [2023-05-13 01:00:06,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +14: [2023-05-13 01:00:06,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +14: [2023-05-13 01:00:06,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +14: [2023-05-13 01:00:06,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +14: [2023-05-13 01:00:06,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +14: [2023-05-13 01:00:06,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +14: [2023-05-13 01:00:06,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +14: [2023-05-13 01:00:06,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +29: [2023-05-13 01:00:06,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +29: [2023-05-13 01:00:06,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +29: [2023-05-13 01:00:06,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +11: [2023-05-13 01:00:06,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +11: [2023-05-13 01:00:06,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +29: [2023-05-13 01:00:06,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +29: [2023-05-13 01:00:06,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +12: [2023-05-13 01:00:06,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +29: [2023-05-13 01:00:06,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +14: [2023-05-13 01:00:06,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +14: [2023-05-13 01:00:06,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +14: [2023-05-13 01:00:06,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +14: [2023-05-13 01:00:06,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +14: [2023-05-13 01:00:06,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +14: [2023-05-13 01:00:06,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +14: [2023-05-13 01:00:06,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +14: [2023-05-13 01:00:06,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 8: [2023-05-13 01:00:06,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +11: [2023-05-13 01:00:06,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +11: [2023-05-13 01:00:06,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +11: [2023-05-13 01:00:06,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +12: [2023-05-13 01:00:06,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +12: [2023-05-13 01:00:06,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +11: [2023-05-13 01:00:06,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +27: [2023-05-13 01:00:06,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +12: [2023-05-13 01:00:06,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +12: [2023-05-13 01:00:06,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +26: [2023-05-13 01:00:06,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +26: [2023-05-13 01:00:06,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +26: [2023-05-13 01:00:06,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +26: [2023-05-13 01:00:06,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +26: [2023-05-13 01:00:06,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +26: [2023-05-13 01:00:06,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +26: [2023-05-13 01:00:06,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +26: [2023-05-13 01:00:06,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +27: [2023-05-13 01:00:06,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +27: [2023-05-13 01:00:06,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +27: [2023-05-13 01:00:06,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +26: [2023-05-13 01:00:06,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +26: [2023-05-13 01:00:06,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +27: [2023-05-13 01:00:06,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +26: [2023-05-13 01:00:06,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +26: [2023-05-13 01:00:06,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +27: [2023-05-13 01:00:06,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +26: [2023-05-13 01:00:06,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +26: [2023-05-13 01:00:06,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +26: [2023-05-13 01:00:06,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +27: [2023-05-13 01:00:06,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +26: [2023-05-13 01:00:06,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +27: [2023-05-13 01:00:06,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +17: [2023-05-13 01:00:06,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +17: [2023-05-13 01:00:06,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +17: [2023-05-13 01:00:06,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +12: [2023-05-13 01:00:06,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +24: [2023-05-13 01:00:06,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +24: [2023-05-13 01:00:06,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +30: [2023-05-13 01:00:06,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +11: [2023-05-13 01:00:06,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +30: [2023-05-13 01:00:06,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +30: [2023-05-13 01:00:06,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +10: [2023-05-13 01:00:06,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +10: [2023-05-13 01:00:06,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +10: [2023-05-13 01:00:06,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +10: [2023-05-13 01:00:06,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +10: [2023-05-13 01:00:06,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +10: [2023-05-13 01:00:06,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +11: [2023-05-13 01:00:06,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +11: [2023-05-13 01:00:06,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +10: [2023-05-13 01:00:06,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +24: [2023-05-13 01:00:06,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +24: [2023-05-13 01:00:06,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +11: [2023-05-13 01:00:06,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +24: [2023-05-13 01:00:06,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +24: [2023-05-13 01:00:06,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +24: [2023-05-13 01:00:06,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +24: [2023-05-13 01:00:06,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +24: [2023-05-13 01:00:06,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +10: [2023-05-13 01:00:06,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +30: [2023-05-13 01:00:06,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +30: [2023-05-13 01:00:06,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +30: [2023-05-13 01:00:06,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +30: [2023-05-13 01:00:06,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +30: [2023-05-13 01:00:06,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +30: [2023-05-13 01:00:06,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +30: [2023-05-13 01:00:06,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +24: [2023-05-13 01:00:06,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +23: [2023-05-13 01:00:06,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +10: [2023-05-13 01:00:06,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +10: [2023-05-13 01:00:06,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +10: [2023-05-13 01:00:06,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +10: [2023-05-13 01:00:06,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +23: [2023-05-13 01:00:06,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +23: [2023-05-13 01:00:06,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +23: [2023-05-13 01:00:06,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +23: [2023-05-13 01:00:06,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +24: [2023-05-13 01:00:06,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +24: [2023-05-13 01:00:06,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +30: [2023-05-13 01:00:06,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +30: [2023-05-13 01:00:06,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +24: [2023-05-13 01:00:06,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +24: [2023-05-13 01:00:06,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +30: [2023-05-13 01:00:06,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +24: [2023-05-13 01:00:06,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +30: [2023-05-13 01:00:06,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +11: [2023-05-13 01:00:06,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +30: [2023-05-13 01:00:06,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +30: [2023-05-13 01:00:06,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +24: [2023-05-13 01:00:06,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +29: [2023-05-13 01:00:06,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +29: [2023-05-13 01:00:06,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +16: [2023-05-13 01:00:06,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +16: [2023-05-13 01:00:06,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +16: [2023-05-13 01:00:06,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +16: [2023-05-13 01:00:06,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +16: [2023-05-13 01:00:06,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +16: [2023-05-13 01:00:06,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +16: [2023-05-13 01:00:06,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +17: [2023-05-13 01:00:06,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +17: [2023-05-13 01:00:06,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +16: [2023-05-13 01:00:06,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +17: [2023-05-13 01:00:06,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +16: [2023-05-13 01:00:06,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +17: [2023-05-13 01:00:06,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +16: [2023-05-13 01:00:06,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +16: [2023-05-13 01:00:06,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +29: [2023-05-13 01:00:06,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +14: [2023-05-13 01:00:06,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +14: [2023-05-13 01:00:06,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +14: [2023-05-13 01:00:06,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +14: [2023-05-13 01:00:06,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +14: [2023-05-13 01:00:06,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +14: [2023-05-13 01:00:06,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +29: [2023-05-13 01:00:06,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +29: [2023-05-13 01:00:06,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +29: [2023-05-13 01:00:06,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +17: [2023-05-13 01:00:06,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +17: [2023-05-13 01:00:06,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +17: [2023-05-13 01:00:06,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +17: [2023-05-13 01:00:06,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +14: [2023-05-13 01:00:06,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +14: [2023-05-13 01:00:06,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +16: [2023-05-13 01:00:06,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +30: [2023-05-13 01:00:06,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +29: [2023-05-13 01:00:06,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +29: [2023-05-13 01:00:06,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +16: [2023-05-13 01:00:06,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +26: [2023-05-13 01:00:06,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +29: [2023-05-13 01:00:06,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +29: [2023-05-13 01:00:06,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +26: [2023-05-13 01:00:06,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +17: [2023-05-13 01:00:06,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:06,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +30: [2023-05-13 01:00:06,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +26: [2023-05-13 01:00:06,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +29: [2023-05-13 01:00:06,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +26: [2023-05-13 01:00:06,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +14: [2023-05-13 01:00:06,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +23: [2023-05-13 01:00:06,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +23: [2023-05-13 01:00:06,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +14: [2023-05-13 01:00:06,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +14: [2023-05-13 01:00:06,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +14: [2023-05-13 01:00:06,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +14: [2023-05-13 01:00:06,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +10: [2023-05-13 01:00:06,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +24: [2023-05-13 01:00:06,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +29: [2023-05-13 01:00:06,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +10: [2023-05-13 01:00:06,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +29: [2023-05-13 01:00:06,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +29: [2023-05-13 01:00:06,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:06,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +14: [2023-05-13 01:00:06,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +14: [2023-05-13 01:00:06,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 6: [2023-05-13 01:00:06,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +14: [2023-05-13 01:00:06,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +17: [2023-05-13 01:00:06,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +17: [2023-05-13 01:00:06,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +17: [2023-05-13 01:00:06,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +17: [2023-05-13 01:00:06,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +10: [2023-05-13 01:00:06,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +10: [2023-05-13 01:00:06,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +10: [2023-05-13 01:00:06,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +10: [2023-05-13 01:00:06,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +30: [2023-05-13 01:00:06,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +26: [2023-05-13 01:00:06,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +29: [2023-05-13 01:00:06,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +13: [2023-05-13 01:00:06,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +13: [2023-05-13 01:00:06,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +13: [2023-05-13 01:00:06,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +29: [2023-05-13 01:00:06,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +10: [2023-05-13 01:00:06,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +23: [2023-05-13 01:00:06,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +24: [2023-05-13 01:00:06,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +26: [2023-05-13 01:00:06,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +13: [2023-05-13 01:00:06,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +13: [2023-05-13 01:00:06,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +13: [2023-05-13 01:00:06,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +13: [2023-05-13 01:00:06,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +13: [2023-05-13 01:00:06,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +13: [2023-05-13 01:00:06,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +13: [2023-05-13 01:00:06,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +13: [2023-05-13 01:00:06,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +24: [2023-05-13 01:00:06,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +24: [2023-05-13 01:00:06,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +26: [2023-05-13 01:00:06,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +26: [2023-05-13 01:00:06,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +26: [2023-05-13 01:00:06,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +26: [2023-05-13 01:00:06,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +30: [2023-05-13 01:00:06,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +10: [2023-05-13 01:00:06,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +30: [2023-05-13 01:00:06,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 3: [2023-05-13 01:00:06,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +13: [2023-05-13 01:00:06,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +25: [2023-05-13 01:00:06,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +25: [2023-05-13 01:00:06,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +13: [2023-05-13 01:00:06,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +13: [2023-05-13 01:00:06,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +26: [2023-05-13 01:00:06,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +13: [2023-05-13 01:00:06,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +25: [2023-05-13 01:00:06,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +13: [2023-05-13 01:00:06,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +23: [2023-05-13 01:00:06,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +26: [2023-05-13 01:00:06,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +25: [2023-05-13 01:00:06,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +25: [2023-05-13 01:00:06,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +25: [2023-05-13 01:00:06,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +25: [2023-05-13 01:00:06,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +24: [2023-05-13 01:00:06,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +24: [2023-05-13 01:00:06,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +24: [2023-05-13 01:00:06,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:06,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +24: [2023-05-13 01:00:06,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +25: [2023-05-13 01:00:06,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +25: [2023-05-13 01:00:06,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +20: [2023-05-13 01:00:06,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +20: [2023-05-13 01:00:06,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +20: [2023-05-13 01:00:06,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +20: [2023-05-13 01:00:06,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +20: [2023-05-13 01:00:06,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +20: [2023-05-13 01:00:06,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +20: [2023-05-13 01:00:06,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +30: [2023-05-13 01:00:06,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +10: [2023-05-13 01:00:06,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +30: [2023-05-13 01:00:06,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +30: [2023-05-13 01:00:06,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +20: [2023-05-13 01:00:06,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +23: [2023-05-13 01:00:06,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +23: [2023-05-13 01:00:06,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +23: [2023-05-13 01:00:06,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +23: [2023-05-13 01:00:06,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:06,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +20: [2023-05-13 01:00:06,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +30: [2023-05-13 01:00:06,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +18: [2023-05-13 01:00:06,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +18: [2023-05-13 01:00:06,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +30: [2023-05-13 01:00:06,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:06,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +25: [2023-05-13 01:00:06,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +25: [2023-05-13 01:00:06,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +20: [2023-05-13 01:00:06,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +25: [2023-05-13 01:00:06,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +10: [2023-05-13 01:00:06,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +25: [2023-05-13 01:00:06,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +10: [2023-05-13 01:00:06,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +18: [2023-05-13 01:00:06,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +18: [2023-05-13 01:00:06,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +18: [2023-05-13 01:00:06,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +18: [2023-05-13 01:00:06,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +10: [2023-05-13 01:00:06,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:06,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +20: [2023-05-13 01:00:06,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +20: [2023-05-13 01:00:06,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +20: [2023-05-13 01:00:06,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +20: [2023-05-13 01:00:06,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +23: [2023-05-13 01:00:06,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +24: [2023-05-13 01:00:06,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +20: [2023-05-13 01:00:06,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +10: [2023-05-13 01:00:06,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +18: [2023-05-13 01:00:06,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... +18: [2023-05-13 01:00:06,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +30: [2023-05-13 01:00:06,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +24: [2023-05-13 01:00:06,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 3: [2023-05-13 01:00:06,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +10: [2023-05-13 01:00:06,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +23: [2023-05-13 01:00:06,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +30: [2023-05-13 01:00:06,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +26: [2023-05-13 01:00:06,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:06,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +26: [2023-05-13 01:00:06,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +26: [2023-05-13 01:00:06,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +26: [2023-05-13 01:00:06,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +30: [2023-05-13 01:00:06,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +24: [2023-05-13 01:00:06,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +30: [2023-05-13 01:00:06,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +24: [2023-05-13 01:00:06,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +24: [2023-05-13 01:00:06,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +23: [2023-05-13 01:00:06,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +30: [2023-05-13 01:00:06,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +30: [2023-05-13 01:00:06,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +19: [2023-05-13 01:00:06,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 1: [2023-05-13 01:00:06,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 1: [2023-05-13 01:00:06,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +19: [2023-05-13 01:00:06,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +19: [2023-05-13 01:00:06,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +19: [2023-05-13 01:00:06,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +19: [2023-05-13 01:00:06,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +19: [2023-05-13 01:00:06,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +19: [2023-05-13 01:00:06,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +23: [2023-05-13 01:00:06,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +23: [2023-05-13 01:00:06,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +23: [2023-05-13 01:00:06,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +13: [2023-05-13 01:00:06,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +13: [2023-05-13 01:00:06,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +13: [2023-05-13 01:00:06,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +24: [2023-05-13 01:00:06,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +23: [2023-05-13 01:00:06,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +25: [2023-05-13 01:00:06,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +25: [2023-05-13 01:00:06,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +20: [2023-05-13 01:00:06,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:06,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +13: [2023-05-13 01:00:06,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 4: [2023-05-13 01:00:06,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 4: [2023-05-13 01:00:06,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +13: [2023-05-13 01:00:06,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +13: [2023-05-13 01:00:06,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +13: [2023-05-13 01:00:06,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +13: [2023-05-13 01:00:06,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +18: [2023-05-13 01:00:06,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +18: [2023-05-13 01:00:06,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 5: [2023-05-13 01:00:06,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +13: [2023-05-13 01:00:06,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +18: [2023-05-13 01:00:06,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 0: [2023-05-13 01:00:06,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +25: [2023-05-13 01:00:06,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +13: [2023-05-13 01:00:06,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +13: [2023-05-13 01:00:06,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +18: [2023-05-13 01:00:06,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:06,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +25: [2023-05-13 01:00:06,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 5: [2023-05-13 01:00:06,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:06,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 2: [2023-05-13 01:00:06,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +20: [2023-05-13 01:00:07,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:07,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +25: [2023-05-13 01:00:07,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +25: [2023-05-13 01:00:07,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +25: [2023-05-13 01:00:07,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +25: [2023-05-13 01:00:07,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +20: [2023-05-13 01:00:07,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +18: [2023-05-13 01:00:07,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +18: [2023-05-13 01:00:07,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +18: [2023-05-13 01:00:07,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +18: [2023-05-13 01:00:07,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +18: [2023-05-13 01:00:07,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +25: [2023-05-13 01:00:07,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +19: [2023-05-13 01:00:06,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +19: [2023-05-13 01:00:06,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +19: [2023-05-13 01:00:06,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +19: [2023-05-13 01:00:06,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +19: [2023-05-13 01:00:06,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +19: [2023-05-13 01:00:06,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +19: [2023-05-13 01:00:06,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +19: [2023-05-13 01:00:06,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +19: [2023-05-13 01:00:06,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +13: [2023-05-13 01:00:07,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +13: [2023-05-13 01:00:07,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +13: [2023-05-13 01:00:07,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +13: [2023-05-13 01:00:07,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +18: [2023-05-13 01:00:07,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +18: [2023-05-13 01:00:07,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +13: [2023-05-13 01:00:07,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +18: [2023-05-13 01:00:07,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +20: [2023-05-13 01:00:07,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +20: [2023-05-13 01:00:07,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +20: [2023-05-13 01:00:07,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. +20: [2023-05-13 01:00:07,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_08-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +25: [2023-05-13 01:00:07,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +20: [2023-05-13 01:00:07,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +18: [2023-05-13 01:00:07,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +25: [2023-05-13 01:00:07,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +18: [2023-05-13 01:00:07,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +25: [2023-05-13 01:00:07,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +25: [2023-05-13 01:00:07,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +18: [2023-05-13 01:00:07,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +25: [2023-05-13 01:00:07,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +18: [2023-05-13 01:00:07,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +20: [2023-05-13 01:00:07,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +20: [2023-05-13 01:00:07,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +20: [2023-05-13 01:00:07,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +19: [2023-05-13 01:00:07,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +19: [2023-05-13 01:00:07,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +19: [2023-05-13 01:00:07,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +19: [2023-05-13 01:00:07,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +19: [2023-05-13 01:00:07,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +19: [2023-05-13 01:00:07,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +19: [2023-05-13 01:00:07,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +19: [2023-05-13 01:00:07,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +19: [2023-05-13 01:00:07,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +19: [2023-05-13 01:00:07,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:07,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:07,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:07,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:07,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:07,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:07,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:07,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:07,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:07,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +28: [2023-05-13 01:00:07,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +28: [2023-05-13 01:00:07,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +28: [2023-05-13 01:00:07,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +28: [2023-05-13 01:00:07,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +28: [2023-05-13 01:00:07,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +28: [2023-05-13 01:00:07,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +28: [2023-05-13 01:00:07,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:07,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:07,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +28: [2023-05-13 01:00:07,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:07,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +15: [2023-05-13 01:00:07,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +15: [2023-05-13 01:00:07,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +28: [2023-05-13 01:00:07,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +15: [2023-05-13 01:00:07,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +15: [2023-05-13 01:00:07,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +28: [2023-05-13 01:00:07,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +28: [2023-05-13 01:00:07,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +28: [2023-05-13 01:00:07,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +28: [2023-05-13 01:00:07,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +28: [2023-05-13 01:00:07,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +28: [2023-05-13 01:00:07,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +28: [2023-05-13 01:00:07,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +21: [2023-05-13 01:00:07,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +21: [2023-05-13 01:00:07,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +21: [2023-05-13 01:00:07,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +21: [2023-05-13 01:00:07,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +21: [2023-05-13 01:00:07,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +21: [2023-05-13 01:00:07,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +21: [2023-05-13 01:00:07,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +21: [2023-05-13 01:00:07,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +21: [2023-05-13 01:00:07,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +21: [2023-05-13 01:00:07,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +12: [2023-05-13 01:00:07,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +12: [2023-05-13 01:00:07,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +12: [2023-05-13 01:00:07,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +12: [2023-05-13 01:00:07,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +12: [2023-05-13 01:00:07,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +12: [2023-05-13 01:00:07,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +12: [2023-05-13 01:00:07,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +12: [2023-05-13 01:00:07,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +21: [2023-05-13 01:00:07,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +21: [2023-05-13 01:00:07,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +21: [2023-05-13 01:00:07,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +12: [2023-05-13 01:00:07,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +21: [2023-05-13 01:00:07,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +21: [2023-05-13 01:00:07,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +21: [2023-05-13 01:00:07,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +12: [2023-05-13 01:00:07,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +12: [2023-05-13 01:00:07,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +12: [2023-05-13 01:00:07,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +12: [2023-05-13 01:00:07,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +12: [2023-05-13 01:00:07,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +12: [2023-05-13 01:00:07,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +12: [2023-05-13 01:00:07,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +19: [2023-05-13 01:00:07,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +19: [2023-05-13 01:00:07,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +19: [2023-05-13 01:00:07,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +19: [2023-05-13 01:00:07,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +19: [2023-05-13 01:00:07,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +19: [2023-05-13 01:00:07,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:07,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +11: [2023-05-13 01:00:07,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +11: [2023-05-13 01:00:07,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +11: [2023-05-13 01:00:07,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +11: [2023-05-13 01:00:07,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +11: [2023-05-13 01:00:07,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +11: [2023-05-13 01:00:07,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +11: [2023-05-13 01:00:07,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +11: [2023-05-13 01:00:07,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +11: [2023-05-13 01:00:07,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +11: [2023-05-13 01:00:07,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +28: [2023-05-13 01:00:07,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +11: [2023-05-13 01:00:07,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +11: [2023-05-13 01:00:07,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +11: [2023-05-13 01:00:07,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +11: [2023-05-13 01:00:07,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +11: [2023-05-13 01:00:07,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +11: [2023-05-13 01:00:07,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +28: [2023-05-13 01:00:07,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:07,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:07,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +21: [2023-05-13 01:00:07,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +28: [2023-05-13 01:00:07,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +28: [2023-05-13 01:00:07,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +28: [2023-05-13 01:00:07,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +28: [2023-05-13 01:00:07,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +28: [2023-05-13 01:00:07,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:07,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:07,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:07,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:07,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:07,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:07,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +12: [2023-05-13 01:00:07,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +21: [2023-05-13 01:00:07,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +21: [2023-05-13 01:00:07,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +21: [2023-05-13 01:00:07,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +21: [2023-05-13 01:00:07,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +21: [2023-05-13 01:00:07,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +21: [2023-05-13 01:00:07,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:07,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:07,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +12: [2023-05-13 01:00:07,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +21: [2023-05-13 01:00:07,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +28: [2023-05-13 01:00:07,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +28: [2023-05-13 01:00:07,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +28: [2023-05-13 01:00:07,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +12: [2023-05-13 01:00:07,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +12: [2023-05-13 01:00:07,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +28: [2023-05-13 01:00:07,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:07,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +28: [2023-05-13 01:00:07,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +21: [2023-05-13 01:00:07,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +15: [2023-05-13 01:00:07,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:07,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:07,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:07,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +11: [2023-05-13 01:00:07,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +11: [2023-05-13 01:00:07,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +11: [2023-05-13 01:00:07,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +21: [2023-05-13 01:00:07,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +21: [2023-05-13 01:00:07,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +12: [2023-05-13 01:00:07,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +12: [2023-05-13 01:00:07,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +12: [2023-05-13 01:00:07,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +12: [2023-05-13 01:00:07,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +12: [2023-05-13 01:00:07,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +21: [2023-05-13 01:00:07,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +21: [2023-05-13 01:00:07,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +21: [2023-05-13 01:00:07,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +31: [2023-05-13 01:00:07,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +31: [2023-05-13 01:00:07,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +31: [2023-05-13 01:00:07,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +31: [2023-05-13 01:00:07,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +31: [2023-05-13 01:00:07,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +31: [2023-05-13 01:00:07,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +31: [2023-05-13 01:00:07,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +31: [2023-05-13 01:00:07,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +11: [2023-05-13 01:00:07,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +31: [2023-05-13 01:00:07,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +11: [2023-05-13 01:00:07,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +11: [2023-05-13 01:00:07,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +11: [2023-05-13 01:00:07,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +21: [2023-05-13 01:00:07,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +31: [2023-05-13 01:00:07,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +31: [2023-05-13 01:00:07,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +31: [2023-05-13 01:00:07,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +12: [2023-05-13 01:00:07,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +31: [2023-05-13 01:00:07,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +12: [2023-05-13 01:00:07,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +31: [2023-05-13 01:00:07,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +31: [2023-05-13 01:00:07,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +31: [2023-05-13 01:00:07,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +21: [2023-05-13 01:00:07,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +11: [2023-05-13 01:00:07,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +11: [2023-05-13 01:00:07,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +11: [2023-05-13 01:00:07,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +22: [2023-05-13 01:00:07,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +22: [2023-05-13 01:00:07,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +22: [2023-05-13 01:00:07,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +22: [2023-05-13 01:00:07,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +22: [2023-05-13 01:00:07,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +22: [2023-05-13 01:00:07,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +22: [2023-05-13 01:00:07,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +22: [2023-05-13 01:00:07,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +12: [2023-05-13 01:00:07,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +27: [2023-05-13 01:00:07,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +27: [2023-05-13 01:00:07,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +27: [2023-05-13 01:00:07,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +27: [2023-05-13 01:00:07,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +27: [2023-05-13 01:00:07,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +27: [2023-05-13 01:00:07,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +27: [2023-05-13 01:00:07,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +27: [2023-05-13 01:00:07,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +12: [2023-05-13 01:00:07,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +22: [2023-05-13 01:00:07,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +27: [2023-05-13 01:00:07,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +22: [2023-05-13 01:00:07,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +22: [2023-05-13 01:00:07,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +12: [2023-05-13 01:00:07,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +22: [2023-05-13 01:00:07,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +27: [2023-05-13 01:00:07,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +22: [2023-05-13 01:00:07,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +27: [2023-05-13 01:00:07,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +22: [2023-05-13 01:00:07,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +22: [2023-05-13 01:00:07,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +27: [2023-05-13 01:00:07,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +22: [2023-05-13 01:00:07,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +12: [2023-05-13 01:00:07,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +27: [2023-05-13 01:00:07,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +27: [2023-05-13 01:00:07,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +27: [2023-05-13 01:00:07,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +27: [2023-05-13 01:00:07,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +11: [2023-05-13 01:00:07,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +12: [2023-05-13 01:00:07,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +10: [2023-05-13 01:00:07,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +10: [2023-05-13 01:00:07,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +10: [2023-05-13 01:00:07,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +10: [2023-05-13 01:00:07,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +10: [2023-05-13 01:00:07,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +10: [2023-05-13 01:00:07,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +10: [2023-05-13 01:00:07,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +10: [2023-05-13 01:00:07,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +11: [2023-05-13 01:00:07,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +11: [2023-05-13 01:00:07,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +11: [2023-05-13 01:00:07,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +11: [2023-05-13 01:00:07,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +10: [2023-05-13 01:00:07,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +10: [2023-05-13 01:00:07,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +10: [2023-05-13 01:00:07,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +10: [2023-05-13 01:00:07,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +10: [2023-05-13 01:00:07,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +10: [2023-05-13 01:00:07,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +10: [2023-05-13 01:00:07,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +10: [2023-05-13 01:00:07,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +29: [2023-05-13 01:00:07,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +29: [2023-05-13 01:00:07,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +29: [2023-05-13 01:00:07,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +29: [2023-05-13 01:00:07,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +29: [2023-05-13 01:00:07,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +29: [2023-05-13 01:00:07,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +29: [2023-05-13 01:00:07,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +29: [2023-05-13 01:00:07,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +31: [2023-05-13 01:00:07,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +29: [2023-05-13 01:00:07,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +29: [2023-05-13 01:00:07,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +29: [2023-05-13 01:00:07,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +29: [2023-05-13 01:00:07,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +29: [2023-05-13 01:00:07,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +29: [2023-05-13 01:00:07,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +29: [2023-05-13 01:00:07,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +29: [2023-05-13 01:00:07,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +11: [2023-05-13 01:00:07,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +31: [2023-05-13 01:00:07,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +31: [2023-05-13 01:00:07,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +31: [2023-05-13 01:00:07,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +31: [2023-05-13 01:00:07,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +31: [2023-05-13 01:00:07,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +31: [2023-05-13 01:00:07,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +31: [2023-05-13 01:00:07,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +26: [2023-05-13 01:00:07,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +26: [2023-05-13 01:00:07,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +26: [2023-05-13 01:00:07,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +26: [2023-05-13 01:00:07,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +26: [2023-05-13 01:00:07,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +26: [2023-05-13 01:00:07,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +26: [2023-05-13 01:00:07,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +26: [2023-05-13 01:00:07,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +31: [2023-05-13 01:00:07,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +22: [2023-05-13 01:00:07,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +27: [2023-05-13 01:00:07,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +22: [2023-05-13 01:00:07,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +26: [2023-05-13 01:00:07,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +26: [2023-05-13 01:00:07,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +26: [2023-05-13 01:00:07,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +26: [2023-05-13 01:00:07,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +26: [2023-05-13 01:00:07,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +26: [2023-05-13 01:00:07,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +26: [2023-05-13 01:00:07,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +26: [2023-05-13 01:00:07,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +27: [2023-05-13 01:00:07,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +10: [2023-05-13 01:00:07,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +27: [2023-05-13 01:00:07,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +27: [2023-05-13 01:00:07,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +27: [2023-05-13 01:00:07,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +10: [2023-05-13 01:00:07,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +31: [2023-05-13 01:00:07,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +22: [2023-05-13 01:00:07,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +22: [2023-05-13 01:00:07,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +31: [2023-05-13 01:00:07,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +14: [2023-05-13 01:00:07,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +14: [2023-05-13 01:00:07,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +14: [2023-05-13 01:00:07,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +14: [2023-05-13 01:00:07,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +14: [2023-05-13 01:00:07,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +27: [2023-05-13 01:00:07,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +27: [2023-05-13 01:00:07,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +27: [2023-05-13 01:00:07,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +22: [2023-05-13 01:00:07,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +14: [2023-05-13 01:00:07,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +14: [2023-05-13 01:00:07,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +14: [2023-05-13 01:00:07,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +31: [2023-05-13 01:00:07,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +31: [2023-05-13 01:00:07,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +31: [2023-05-13 01:00:07,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +22: [2023-05-13 01:00:07,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +31: [2023-05-13 01:00:07,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +14: [2023-05-13 01:00:07,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +14: [2023-05-13 01:00:07,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +14: [2023-05-13 01:00:07,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +14: [2023-05-13 01:00:07,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +14: [2023-05-13 01:00:07,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +14: [2023-05-13 01:00:07,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +14: [2023-05-13 01:00:07,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +14: [2023-05-13 01:00:07,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +10: [2023-05-13 01:00:07,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +27: [2023-05-13 01:00:07,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +31: [2023-05-13 01:00:07,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +29: [2023-05-13 01:00:07,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +10: [2023-05-13 01:00:07,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +10: [2023-05-13 01:00:07,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +16: [2023-05-13 01:00:07,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +16: [2023-05-13 01:00:07,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +16: [2023-05-13 01:00:07,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +16: [2023-05-13 01:00:07,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +16: [2023-05-13 01:00:07,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +16: [2023-05-13 01:00:07,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +16: [2023-05-13 01:00:07,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +22: [2023-05-13 01:00:07,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +10: [2023-05-13 01:00:07,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +10: [2023-05-13 01:00:07,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +10: [2023-05-13 01:00:07,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +16: [2023-05-13 01:00:07,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +27: [2023-05-13 01:00:07,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +22: [2023-05-13 01:00:07,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +10: [2023-05-13 01:00:07,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +20: [2023-05-13 01:00:07,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +20: [2023-05-13 01:00:07,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +20: [2023-05-13 01:00:07,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +20: [2023-05-13 01:00:07,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +29: [2023-05-13 01:00:07,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +20: [2023-05-13 01:00:07,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +20: [2023-05-13 01:00:07,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +29: [2023-05-13 01:00:07,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +20: [2023-05-13 01:00:07,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +27: [2023-05-13 01:00:07,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +29: [2023-05-13 01:00:07,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +29: [2023-05-13 01:00:07,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +29: [2023-05-13 01:00:07,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +16: [2023-05-13 01:00:07,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +29: [2023-05-13 01:00:07,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +29: [2023-05-13 01:00:07,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +20: [2023-05-13 01:00:07,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +16: [2023-05-13 01:00:07,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +16: [2023-05-13 01:00:07,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +16: [2023-05-13 01:00:07,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +27: [2023-05-13 01:00:07,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +27: [2023-05-13 01:00:07,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +22: [2023-05-13 01:00:07,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +10: [2023-05-13 01:00:07,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +27: [2023-05-13 01:00:07,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +27: [2023-05-13 01:00:07,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +20: [2023-05-13 01:00:07,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +20: [2023-05-13 01:00:07,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +20: [2023-05-13 01:00:07,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +20: [2023-05-13 01:00:07,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +20: [2023-05-13 01:00:07,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +20: [2023-05-13 01:00:07,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +22: [2023-05-13 01:00:07,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +27: [2023-05-13 01:00:07,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +22: [2023-05-13 01:00:07,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +22: [2023-05-13 01:00:07,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +10: [2023-05-13 01:00:07,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +26: [2023-05-13 01:00:07,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +29: [2023-05-13 01:00:07,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +26: [2023-05-13 01:00:07,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +10: [2023-05-13 01:00:07,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +10: [2023-05-13 01:00:07,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +10: [2023-05-13 01:00:07,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +10: [2023-05-13 01:00:07,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +17: [2023-05-13 01:00:07,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +17: [2023-05-13 01:00:07,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +17: [2023-05-13 01:00:07,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +17: [2023-05-13 01:00:07,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +17: [2023-05-13 01:00:07,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +17: [2023-05-13 01:00:07,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +17: [2023-05-13 01:00:07,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +17: [2023-05-13 01:00:07,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +29: [2023-05-13 01:00:07,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +10: [2023-05-13 01:00:07,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +17: [2023-05-13 01:00:07,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +17: [2023-05-13 01:00:07,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +29: [2023-05-13 01:00:07,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +17: [2023-05-13 01:00:07,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +29: [2023-05-13 01:00:07,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +29: [2023-05-13 01:00:07,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +17: [2023-05-13 01:00:07,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +17: [2023-05-13 01:00:07,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +17: [2023-05-13 01:00:07,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +17: [2023-05-13 01:00:07,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +29: [2023-05-13 01:00:07,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +29: [2023-05-13 01:00:07,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +17: [2023-05-13 01:00:07,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +26: [2023-05-13 01:00:07,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +29: [2023-05-13 01:00:07,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +16: [2023-05-13 01:00:07,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +14: [2023-05-13 01:00:07,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +14: [2023-05-13 01:00:07,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +14: [2023-05-13 01:00:07,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +14: [2023-05-13 01:00:07,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +14: [2023-05-13 01:00:07,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +14: [2023-05-13 01:00:07,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +26: [2023-05-13 01:00:07,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +26: [2023-05-13 01:00:07,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +26: [2023-05-13 01:00:07,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +26: [2023-05-13 01:00:07,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +26: [2023-05-13 01:00:07,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +26: [2023-05-13 01:00:07,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +25: [2023-05-13 01:00:07,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +25: [2023-05-13 01:00:07,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +25: [2023-05-13 01:00:07,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +14: [2023-05-13 01:00:07,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +26: [2023-05-13 01:00:07,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +25: [2023-05-13 01:00:07,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +25: [2023-05-13 01:00:07,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +25: [2023-05-13 01:00:07,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +25: [2023-05-13 01:00:07,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +25: [2023-05-13 01:00:07,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +25: [2023-05-13 01:00:07,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +25: [2023-05-13 01:00:07,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +26: [2023-05-13 01:00:07,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +20: [2023-05-13 01:00:07,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +14: [2023-05-13 01:00:07,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +25: [2023-05-13 01:00:07,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +16: [2023-05-13 01:00:07,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +25: [2023-05-13 01:00:07,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +25: [2023-05-13 01:00:07,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +25: [2023-05-13 01:00:07,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +25: [2023-05-13 01:00:07,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +25: [2023-05-13 01:00:07,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +14: [2023-05-13 01:00:07,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +14: [2023-05-13 01:00:07,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +14: [2023-05-13 01:00:07,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +14: [2023-05-13 01:00:07,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +26: [2023-05-13 01:00:07,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +14: [2023-05-13 01:00:07,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +14: [2023-05-13 01:00:07,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +16: [2023-05-13 01:00:07,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +26: [2023-05-13 01:00:07,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +26: [2023-05-13 01:00:07,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +17: [2023-05-13 01:00:07,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +17: [2023-05-13 01:00:07,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +16: [2023-05-13 01:00:07,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +16: [2023-05-13 01:00:07,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +16: [2023-05-13 01:00:07,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +26: [2023-05-13 01:00:07,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +26: [2023-05-13 01:00:07,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +16: [2023-05-13 01:00:07,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +16: [2023-05-13 01:00:07,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +20: [2023-05-13 01:00:07,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +14: [2023-05-13 01:00:07,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +14: [2023-05-13 01:00:07,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +20: [2023-05-13 01:00:07,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +20: [2023-05-13 01:00:07,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +20: [2023-05-13 01:00:07,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +17: [2023-05-13 01:00:07,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +17: [2023-05-13 01:00:07,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +17: [2023-05-13 01:00:07,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +25: [2023-05-13 01:00:07,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +25: [2023-05-13 01:00:07,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +16: [2023-05-13 01:00:07,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +20: [2023-05-13 01:00:07,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +16: [2023-05-13 01:00:07,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +17: [2023-05-13 01:00:07,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +17: [2023-05-13 01:00:07,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +17: [2023-05-13 01:00:07,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +17: [2023-05-13 01:00:07,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +17: [2023-05-13 01:00:07,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +16: [2023-05-13 01:00:07,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +16: [2023-05-13 01:00:07,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +20: [2023-05-13 01:00:07,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +17: [2023-05-13 01:00:07,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +20: [2023-05-13 01:00:07,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +25: [2023-05-13 01:00:07,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +25: [2023-05-13 01:00:07,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +25: [2023-05-13 01:00:07,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +20: [2023-05-13 01:00:07,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +17: [2023-05-13 01:00:07,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +25: [2023-05-13 01:00:07,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +25: [2023-05-13 01:00:07,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +25: [2023-05-13 01:00:07,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +25: [2023-05-13 01:00:07,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +25: [2023-05-13 01:00:07,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +15: [2023-05-13 01:00:07,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +15: [2023-05-13 01:00:07,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +15: [2023-05-13 01:00:07,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +15: [2023-05-13 01:00:07,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +15: [2023-05-13 01:00:07,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +15: [2023-05-13 01:00:07,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +15: [2023-05-13 01:00:07,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +17: [2023-05-13 01:00:07,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +15: [2023-05-13 01:00:07,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +15: [2023-05-13 01:00:07,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +17: [2023-05-13 01:00:07,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +15: [2023-05-13 01:00:07,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +17: [2023-05-13 01:00:07,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +17: [2023-05-13 01:00:07,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +25: [2023-05-13 01:00:07,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +15: [2023-05-13 01:00:07,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +15: [2023-05-13 01:00:07,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:07,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:07,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:07,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:07,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +13: [2023-05-13 01:00:07,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +13: [2023-05-13 01:00:07,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +13: [2023-05-13 01:00:07,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +13: [2023-05-13 01:00:07,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +13: [2023-05-13 01:00:07,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +13: [2023-05-13 01:00:07,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +23: [2023-05-13 01:00:07,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +23: [2023-05-13 01:00:07,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +23: [2023-05-13 01:00:07,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +30: [2023-05-13 01:00:07,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +25: [2023-05-13 01:00:07,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +13: [2023-05-13 01:00:07,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +30: [2023-05-13 01:00:07,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +30: [2023-05-13 01:00:07,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +30: [2023-05-13 01:00:07,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +23: [2023-05-13 01:00:07,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +23: [2023-05-13 01:00:07,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +23: [2023-05-13 01:00:07,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +23: [2023-05-13 01:00:07,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +13: [2023-05-13 01:00:07,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +30: [2023-05-13 01:00:07,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +30: [2023-05-13 01:00:07,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +30: [2023-05-13 01:00:07,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +23: [2023-05-13 01:00:07,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +30: [2023-05-13 01:00:07,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +25: [2023-05-13 01:00:07,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +13: [2023-05-13 01:00:07,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +23: [2023-05-13 01:00:07,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +23: [2023-05-13 01:00:07,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +25: [2023-05-13 01:00:07,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +25: [2023-05-13 01:00:07,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +25: [2023-05-13 01:00:07,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +13: [2023-05-13 01:00:07,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +23: [2023-05-13 01:00:07,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +30: [2023-05-13 01:00:07,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +13: [2023-05-13 01:00:07,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +30: [2023-05-13 01:00:07,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +13: [2023-05-13 01:00:07,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +23: [2023-05-13 01:00:07,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +23: [2023-05-13 01:00:07,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +13: [2023-05-13 01:00:07,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +23: [2023-05-13 01:00:07,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +23: [2023-05-13 01:00:07,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +30: [2023-05-13 01:00:07,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +30: [2023-05-13 01:00:07,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +23: [2023-05-13 01:00:07,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +30: [2023-05-13 01:00:07,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +30: [2023-05-13 01:00:07,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +12: [2023-05-13 01:00:07,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +12: [2023-05-13 01:00:07,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +12: [2023-05-13 01:00:07,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +12: [2023-05-13 01:00:07,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +12: [2023-05-13 01:00:07,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +12: [2023-05-13 01:00:07,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +12: [2023-05-13 01:00:07,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +12: [2023-05-13 01:00:07,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +12: [2023-05-13 01:00:07,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:07,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +28: [2023-05-13 01:00:07,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +28: [2023-05-13 01:00:07,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +28: [2023-05-13 01:00:07,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +28: [2023-05-13 01:00:07,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +28: [2023-05-13 01:00:07,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +12: [2023-05-13 01:00:07,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:07,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +28: [2023-05-13 01:00:07,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:07,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +28: [2023-05-13 01:00:07,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:07,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +11: [2023-05-13 01:00:07,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +11: [2023-05-13 01:00:07,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +11: [2023-05-13 01:00:07,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +19: [2023-05-13 01:00:07,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +19: [2023-05-13 01:00:07,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +19: [2023-05-13 01:00:07,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +19: [2023-05-13 01:00:07,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +11: [2023-05-13 01:00:07,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +19: [2023-05-13 01:00:07,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +19: [2023-05-13 01:00:07,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +11: [2023-05-13 01:00:07,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +11: [2023-05-13 01:00:07,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +19: [2023-05-13 01:00:07,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +12: [2023-05-13 01:00:07,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +11: [2023-05-13 01:00:07,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +24: [2023-05-13 01:00:07,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +24: [2023-05-13 01:00:07,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +24: [2023-05-13 01:00:07,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +24: [2023-05-13 01:00:07,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +11: [2023-05-13 01:00:07,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +19: [2023-05-13 01:00:07,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +24: [2023-05-13 01:00:07,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +12: [2023-05-13 01:00:07,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +12: [2023-05-13 01:00:07,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +12: [2023-05-13 01:00:07,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +12: [2023-05-13 01:00:07,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +12: [2023-05-13 01:00:07,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:07,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +19: [2023-05-13 01:00:07,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +11: [2023-05-13 01:00:07,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:07,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +11: [2023-05-13 01:00:07,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +11: [2023-05-13 01:00:07,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:07,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +11: [2023-05-13 01:00:07,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +11: [2023-05-13 01:00:07,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +11: [2023-05-13 01:00:07,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +11: [2023-05-13 01:00:07,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:07,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +15: [2023-05-13 01:00:07,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +15: [2023-05-13 01:00:07,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +24: [2023-05-13 01:00:07,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +11: [2023-05-13 01:00:07,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:07,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +24: [2023-05-13 01:00:07,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +24: [2023-05-13 01:00:07,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +19: [2023-05-13 01:00:07,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +19: [2023-05-13 01:00:07,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +19: [2023-05-13 01:00:07,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +19: [2023-05-13 01:00:07,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +19: [2023-05-13 01:00:07,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +19: [2023-05-13 01:00:07,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +19: [2023-05-13 01:00:07,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +15: [2023-05-13 01:00:07,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +23: [2023-05-13 01:00:07,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +23: [2023-05-13 01:00:07,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:07,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +15: [2023-05-13 01:00:07,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +15: [2023-05-13 01:00:07,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +13: [2023-05-13 01:00:07,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:07,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +30: [2023-05-13 01:00:07,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +13: [2023-05-13 01:00:07,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +30: [2023-05-13 01:00:07,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +27: [2023-05-13 01:00:07,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +27: [2023-05-13 01:00:07,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +27: [2023-05-13 01:00:07,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +27: [2023-05-13 01:00:07,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +27: [2023-05-13 01:00:07,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +27: [2023-05-13 01:00:07,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +27: [2023-05-13 01:00:07,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +27: [2023-05-13 01:00:07,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +15: [2023-05-13 01:00:07,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +18: [2023-05-13 01:00:07,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +18: [2023-05-13 01:00:07,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +15: [2023-05-13 01:00:07,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +27: [2023-05-13 01:00:07,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +27: [2023-05-13 01:00:07,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +18: [2023-05-13 01:00:07,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +27: [2023-05-13 01:00:07,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +27: [2023-05-13 01:00:07,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +18: [2023-05-13 01:00:07,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +18: [2023-05-13 01:00:07,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +18: [2023-05-13 01:00:07,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +18: [2023-05-13 01:00:07,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +18: [2023-05-13 01:00:07,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +30: [2023-05-13 01:00:07,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +18: [2023-05-13 01:00:07,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +27: [2023-05-13 01:00:07,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +18: [2023-05-13 01:00:07,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +27: [2023-05-13 01:00:07,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +27: [2023-05-13 01:00:07,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +27: [2023-05-13 01:00:07,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +18: [2023-05-13 01:00:07,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +30: [2023-05-13 01:00:07,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +13: [2023-05-13 01:00:07,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +13: [2023-05-13 01:00:07,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:07,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +18: [2023-05-13 01:00:07,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +18: [2023-05-13 01:00:07,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +12: [2023-05-13 01:00:07,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +18: [2023-05-13 01:00:07,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +18: [2023-05-13 01:00:07,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +18: [2023-05-13 01:00:07,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +23: [2023-05-13 01:00:07,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +28: [2023-05-13 01:00:07,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +13: [2023-05-13 01:00:07,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +23: [2023-05-13 01:00:07,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +29: [2023-05-13 01:00:07,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +29: [2023-05-13 01:00:07,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +29: [2023-05-13 01:00:07,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +29: [2023-05-13 01:00:07,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +29: [2023-05-13 01:00:07,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +29: [2023-05-13 01:00:07,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +29: [2023-05-13 01:00:07,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +29: [2023-05-13 01:00:07,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +30: [2023-05-13 01:00:07,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +23: [2023-05-13 01:00:07,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +29: [2023-05-13 01:00:07,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +13: [2023-05-13 01:00:07,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +29: [2023-05-13 01:00:07,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +13: [2023-05-13 01:00:07,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +30: [2023-05-13 01:00:07,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +23: [2023-05-13 01:00:07,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +19: [2023-05-13 01:00:07,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +29: [2023-05-13 01:00:07,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:07,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +29: [2023-05-13 01:00:07,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +13: [2023-05-13 01:00:07,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +29: [2023-05-13 01:00:07,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +13: [2023-05-13 01:00:07,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:07,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +29: [2023-05-13 01:00:07,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +29: [2023-05-13 01:00:07,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +29: [2023-05-13 01:00:07,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +15: [2023-05-13 01:00:07,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt... +15: [2023-05-13 01:00:07,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:07,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +11: [2023-05-13 01:00:07,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +11: [2023-05-13 01:00:07,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +11: [2023-05-13 01:00:07,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +11: [2023-05-13 01:00:07,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +15: [2023-05-13 01:00:07,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +28: [2023-05-13 01:00:07,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +30: [2023-05-13 01:00:07,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +30: [2023-05-13 01:00:07,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:07,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +22: [2023-05-13 01:00:07,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +22: [2023-05-13 01:00:07,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +22: [2023-05-13 01:00:07,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +22: [2023-05-13 01:00:07,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +22: [2023-05-13 01:00:07,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +22: [2023-05-13 01:00:07,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +22: [2023-05-13 01:00:07,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +12: [2023-05-13 01:00:07,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +28: [2023-05-13 01:00:07,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +30: [2023-05-13 01:00:07,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +22: [2023-05-13 01:00:07,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +22: [2023-05-13 01:00:07,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +30: [2023-05-13 01:00:07,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +11: [2023-05-13 01:00:07,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +22: [2023-05-13 01:00:07,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +23: [2023-05-13 01:00:07,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +23: [2023-05-13 01:00:07,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +23: [2023-05-13 01:00:07,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +28: [2023-05-13 01:00:07,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +22: [2023-05-13 01:00:07,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +22: [2023-05-13 01:00:07,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +13: [2023-05-13 01:00:07,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +13: [2023-05-13 01:00:07,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +22: [2023-05-13 01:00:07,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +22: [2023-05-13 01:00:07,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +12: [2023-05-13 01:00:07,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +12: [2023-05-13 01:00:07,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +22: [2023-05-13 01:00:07,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +23: [2023-05-13 01:00:07,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +13: [2023-05-13 01:00:07,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +13: [2023-05-13 01:00:07,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +23: [2023-05-13 01:00:07,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +23: [2023-05-13 01:00:07,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +28: [2023-05-13 01:00:07,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +19: [2023-05-13 01:00:07,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +24: [2023-05-13 01:00:07,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +24: [2023-05-13 01:00:07,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +24: [2023-05-13 01:00:07,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:07,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +13: [2023-05-13 01:00:07,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:07,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +24: [2023-05-13 01:00:07,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +24: [2023-05-13 01:00:07,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +11: [2023-05-13 01:00:07,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +11: [2023-05-13 01:00:07,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +19: [2023-05-13 01:00:07,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +19: [2023-05-13 01:00:07,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +19: [2023-05-13 01:00:07,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +11: [2023-05-13 01:00:07,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +11: [2023-05-13 01:00:07,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +11: [2023-05-13 01:00:07,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +11: [2023-05-13 01:00:07,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +28: [2023-05-13 01:00:07,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +12: [2023-05-13 01:00:07,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +12: [2023-05-13 01:00:07,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +12: [2023-05-13 01:00:07,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +12: [2023-05-13 01:00:07,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +30: [2023-05-13 01:00:07,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +18: [2023-05-13 01:00:07,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +28: [2023-05-13 01:00:07,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +28: [2023-05-13 01:00:07,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +27: [2023-05-13 01:00:07,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +27: [2023-05-13 01:00:07,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +11: [2023-05-13 01:00:07,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +12: [2023-05-13 01:00:07,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +18: [2023-05-13 01:00:07,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +28: [2023-05-13 01:00:07,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +12: [2023-05-13 01:00:07,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +27: [2023-05-13 01:00:07,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +19: [2023-05-13 01:00:07,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +19: [2023-05-13 01:00:07,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +19: [2023-05-13 01:00:07,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +19: [2023-05-13 01:00:07,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +30: [2023-05-13 01:00:07,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +27: [2023-05-13 01:00:07,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +27: [2023-05-13 01:00:07,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +27: [2023-05-13 01:00:07,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +27: [2023-05-13 01:00:07,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +23: [2023-05-13 01:00:07,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +23: [2023-05-13 01:00:07,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:07,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +12: [2023-05-13 01:00:07,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +11: [2023-05-13 01:00:07,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +23: [2023-05-13 01:00:07,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +29: [2023-05-13 01:00:07,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +29: [2023-05-13 01:00:07,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:07,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +18: [2023-05-13 01:00:07,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +24: [2023-05-13 01:00:07,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +23: [2023-05-13 01:00:07,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +27: [2023-05-13 01:00:07,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +30: [2023-05-13 01:00:07,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +22: [2023-05-13 01:00:07,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +18: [2023-05-13 01:00:07,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +18: [2023-05-13 01:00:07,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +18: [2023-05-13 01:00:07,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +18: [2023-05-13 01:00:07,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +19: [2023-05-13 01:00:07,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +24: [2023-05-13 01:00:07,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +29: [2023-05-13 01:00:07,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +19: [2023-05-13 01:00:07,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +11: [2023-05-13 01:00:07,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +11: [2023-05-13 01:00:07,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +27: [2023-05-13 01:00:07,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +24: [2023-05-13 01:00:07,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:07,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +18: [2023-05-13 01:00:07,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +27: [2023-05-13 01:00:07,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +19: [2023-05-13 01:00:07,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +29: [2023-05-13 01:00:07,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +22: [2023-05-13 01:00:07,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +18: [2023-05-13 01:00:07,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +12: [2023-05-13 01:00:07,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +27: [2023-05-13 01:00:07,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +29: [2023-05-13 01:00:07,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +29: [2023-05-13 01:00:07,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +24: [2023-05-13 01:00:07,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +29: [2023-05-13 01:00:07,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +27: [2023-05-13 01:00:07,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +12: [2023-05-13 01:00:07,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +12: [2023-05-13 01:00:07,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +29: [2023-05-13 01:00:07,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +27: [2023-05-13 01:00:07,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +29: [2023-05-13 01:00:07,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +12: [2023-05-13 01:00:07,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +11: [2023-05-13 01:00:07,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +27: [2023-05-13 01:00:07,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +27: [2023-05-13 01:00:07,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +19: [2023-05-13 01:00:07,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. +22: [2023-05-13 01:00:07,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +19: [2023-05-13 01:00:07,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +18: [2023-05-13 01:00:07,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_09-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +22: [2023-05-13 01:00:07,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +29: [2023-05-13 01:00:07,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +19: [2023-05-13 01:00:07,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +19: [2023-05-13 01:00:07,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +12: [2023-05-13 01:00:07,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +27: [2023-05-13 01:00:07,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +18: [2023-05-13 01:00:07,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +18: [2023-05-13 01:00:07,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +14: [2023-05-13 01:00:07,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +14: [2023-05-13 01:00:07,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +14: [2023-05-13 01:00:07,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +14: [2023-05-13 01:00:07,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +14: [2023-05-13 01:00:07,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +14: [2023-05-13 01:00:07,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +14: [2023-05-13 01:00:07,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +14: [2023-05-13 01:00:07,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +18: [2023-05-13 01:00:07,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +14: [2023-05-13 01:00:07,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +14: [2023-05-13 01:00:07,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +14: [2023-05-13 01:00:07,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +14: [2023-05-13 01:00:07,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +22: [2023-05-13 01:00:07,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +14: [2023-05-13 01:00:07,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +14: [2023-05-13 01:00:07,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +18: [2023-05-13 01:00:07,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +14: [2023-05-13 01:00:07,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +14: [2023-05-13 01:00:07,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +18: [2023-05-13 01:00:07,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +29: [2023-05-13 01:00:07,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +22: [2023-05-13 01:00:07,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +22: [2023-05-13 01:00:07,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +29: [2023-05-13 01:00:07,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +22: [2023-05-13 01:00:07,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +10: [2023-05-13 01:00:07,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +10: [2023-05-13 01:00:07,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +22: [2023-05-13 01:00:07,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +10: [2023-05-13 01:00:07,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +10: [2023-05-13 01:00:07,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +10: [2023-05-13 01:00:07,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +18: [2023-05-13 01:00:07,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +10: [2023-05-13 01:00:07,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +10: [2023-05-13 01:00:07,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +10: [2023-05-13 01:00:07,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +29: [2023-05-13 01:00:07,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +29: [2023-05-13 01:00:07,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +10: [2023-05-13 01:00:07,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +10: [2023-05-13 01:00:07,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +29: [2023-05-13 01:00:07,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +10: [2023-05-13 01:00:07,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +29: [2023-05-13 01:00:07,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +10: [2023-05-13 01:00:07,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +10: [2023-05-13 01:00:07,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +10: [2023-05-13 01:00:07,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +10: [2023-05-13 01:00:07,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +10: [2023-05-13 01:00:07,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +14: [2023-05-13 01:00:07,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +14: [2023-05-13 01:00:07,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +14: [2023-05-13 01:00:07,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +14: [2023-05-13 01:00:07,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +14: [2023-05-13 01:00:07,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +14: [2023-05-13 01:00:07,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +20: [2023-05-13 01:00:07,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +20: [2023-05-13 01:00:07,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +14: [2023-05-13 01:00:07,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +20: [2023-05-13 01:00:07,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +20: [2023-05-13 01:00:07,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +20: [2023-05-13 01:00:07,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +20: [2023-05-13 01:00:07,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +20: [2023-05-13 01:00:07,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +20: [2023-05-13 01:00:07,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +20: [2023-05-13 01:00:07,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +10: [2023-05-13 01:00:07,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +14: [2023-05-13 01:00:07,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +20: [2023-05-13 01:00:07,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +20: [2023-05-13 01:00:07,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +10: [2023-05-13 01:00:07,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +10: [2023-05-13 01:00:07,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +10: [2023-05-13 01:00:07,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +10: [2023-05-13 01:00:07,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +10: [2023-05-13 01:00:07,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +10: [2023-05-13 01:00:07,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +10: [2023-05-13 01:00:07,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +14: [2023-05-13 01:00:07,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +14: [2023-05-13 01:00:07,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +14: [2023-05-13 01:00:07,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +14: [2023-05-13 01:00:07,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +14: [2023-05-13 01:00:07,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +10: [2023-05-13 01:00:07,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +14: [2023-05-13 01:00:07,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +21: [2023-05-13 01:00:07,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +21: [2023-05-13 01:00:07,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +14: [2023-05-13 01:00:07,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +14: [2023-05-13 01:00:07,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +21: [2023-05-13 01:00:07,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +21: [2023-05-13 01:00:07,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +21: [2023-05-13 01:00:07,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +21: [2023-05-13 01:00:07,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +21: [2023-05-13 01:00:07,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +21: [2023-05-13 01:00:07,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +21: [2023-05-13 01:00:07,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +21: [2023-05-13 01:00:07,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +21: [2023-05-13 01:00:07,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +21: [2023-05-13 01:00:07,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +21: [2023-05-13 01:00:07,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +21: [2023-05-13 01:00:07,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +21: [2023-05-13 01:00:07,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +21: [2023-05-13 01:00:07,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +10: [2023-05-13 01:00:07,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +10: [2023-05-13 01:00:07,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +10: [2023-05-13 01:00:07,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +10: [2023-05-13 01:00:07,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +10: [2023-05-13 01:00:07,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +10: [2023-05-13 01:00:07,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +10: [2023-05-13 01:00:07,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +20: [2023-05-13 01:00:07,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +26: [2023-05-13 01:00:07,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +26: [2023-05-13 01:00:07,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +26: [2023-05-13 01:00:07,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +26: [2023-05-13 01:00:07,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +26: [2023-05-13 01:00:07,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +26: [2023-05-13 01:00:07,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +26: [2023-05-13 01:00:07,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +26: [2023-05-13 01:00:07,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +26: [2023-05-13 01:00:07,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +26: [2023-05-13 01:00:07,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +26: [2023-05-13 01:00:07,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +26: [2023-05-13 01:00:07,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +26: [2023-05-13 01:00:07,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +26: [2023-05-13 01:00:07,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +26: [2023-05-13 01:00:07,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +26: [2023-05-13 01:00:07,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +20: [2023-05-13 01:00:07,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +20: [2023-05-13 01:00:07,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +31: [2023-05-13 01:00:07,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +31: [2023-05-13 01:00:07,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +31: [2023-05-13 01:00:07,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +31: [2023-05-13 01:00:07,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +31: [2023-05-13 01:00:07,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +31: [2023-05-13 01:00:07,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +31: [2023-05-13 01:00:07,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +31: [2023-05-13 01:00:07,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +20: [2023-05-13 01:00:07,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +20: [2023-05-13 01:00:07,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +21: [2023-05-13 01:00:07,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +21: [2023-05-13 01:00:07,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +16: [2023-05-13 01:00:07,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +31: [2023-05-13 01:00:07,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +31: [2023-05-13 01:00:07,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +21: [2023-05-13 01:00:07,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +21: [2023-05-13 01:00:07,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +16: [2023-05-13 01:00:07,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +31: [2023-05-13 01:00:07,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +31: [2023-05-13 01:00:07,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +31: [2023-05-13 01:00:07,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +31: [2023-05-13 01:00:07,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +16: [2023-05-13 01:00:07,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +31: [2023-05-13 01:00:07,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +16: [2023-05-13 01:00:07,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +16: [2023-05-13 01:00:07,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +16: [2023-05-13 01:00:07,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +31: [2023-05-13 01:00:07,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +17: [2023-05-13 01:00:07,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +17: [2023-05-13 01:00:07,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +17: [2023-05-13 01:00:07,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +17: [2023-05-13 01:00:07,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +17: [2023-05-13 01:00:07,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +17: [2023-05-13 01:00:07,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +17: [2023-05-13 01:00:07,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +30: [2023-05-13 01:00:07,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +30: [2023-05-13 01:00:07,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +30: [2023-05-13 01:00:07,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +30: [2023-05-13 01:00:07,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +30: [2023-05-13 01:00:07,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +30: [2023-05-13 01:00:07,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +17: [2023-05-13 01:00:07,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +17: [2023-05-13 01:00:07,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +17: [2023-05-13 01:00:07,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +23: [2023-05-13 01:00:07,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +23: [2023-05-13 01:00:07,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +23: [2023-05-13 01:00:07,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +17: [2023-05-13 01:00:07,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +23: [2023-05-13 01:00:07,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +23: [2023-05-13 01:00:07,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +23: [2023-05-13 01:00:07,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +23: [2023-05-13 01:00:07,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +20: [2023-05-13 01:00:07,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +23: [2023-05-13 01:00:07,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +21: [2023-05-13 01:00:07,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +30: [2023-05-13 01:00:07,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +17: [2023-05-13 01:00:07,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +16: [2023-05-13 01:00:07,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +17: [2023-05-13 01:00:07,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +17: [2023-05-13 01:00:07,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +17: [2023-05-13 01:00:07,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +30: [2023-05-13 01:00:07,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +16: [2023-05-13 01:00:07,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +17: [2023-05-13 01:00:07,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +23: [2023-05-13 01:00:07,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +23: [2023-05-13 01:00:07,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +13: [2023-05-13 01:00:07,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +30: [2023-05-13 01:00:07,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +23: [2023-05-13 01:00:07,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +13: [2023-05-13 01:00:07,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +23: [2023-05-13 01:00:07,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +23: [2023-05-13 01:00:07,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +23: [2023-05-13 01:00:07,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +13: [2023-05-13 01:00:07,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +13: [2023-05-13 01:00:07,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +13: [2023-05-13 01:00:07,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +23: [2023-05-13 01:00:07,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +23: [2023-05-13 01:00:07,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +21: [2023-05-13 01:00:07,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +20: [2023-05-13 01:00:07,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +20: [2023-05-13 01:00:07,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +13: [2023-05-13 01:00:07,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +13: [2023-05-13 01:00:07,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +13: [2023-05-13 01:00:07,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +13: [2023-05-13 01:00:07,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +21: [2023-05-13 01:00:07,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +21: [2023-05-13 01:00:07,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +21: [2023-05-13 01:00:07,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +21: [2023-05-13 01:00:07,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +21: [2023-05-13 01:00:07,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +21: [2023-05-13 01:00:07,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +20: [2023-05-13 01:00:07,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +26: [2023-05-13 01:00:07,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +26: [2023-05-13 01:00:07,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +20: [2023-05-13 01:00:07,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +21: [2023-05-13 01:00:07,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +30: [2023-05-13 01:00:07,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +20: [2023-05-13 01:00:07,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +26: [2023-05-13 01:00:07,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +20: [2023-05-13 01:00:07,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +20: [2023-05-13 01:00:07,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +21: [2023-05-13 01:00:07,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +21: [2023-05-13 01:00:07,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +21: [2023-05-13 01:00:07,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +31: [2023-05-13 01:00:07,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +31: [2023-05-13 01:00:07,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +17: [2023-05-13 01:00:07,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +31: [2023-05-13 01:00:07,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +31: [2023-05-13 01:00:07,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +31: [2023-05-13 01:00:07,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +26: [2023-05-13 01:00:07,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +26: [2023-05-13 01:00:07,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +26: [2023-05-13 01:00:07,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +26: [2023-05-13 01:00:07,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +26: [2023-05-13 01:00:07,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +31: [2023-05-13 01:00:07,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +31: [2023-05-13 01:00:07,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +24: [2023-05-13 01:00:07,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +26: [2023-05-13 01:00:07,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +26: [2023-05-13 01:00:07,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:07,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +30: [2023-05-13 01:00:07,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +23: [2023-05-13 01:00:07,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +23: [2023-05-13 01:00:07,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +24: [2023-05-13 01:00:07,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:07,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +30: [2023-05-13 01:00:07,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +31: [2023-05-13 01:00:07,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +17: [2023-05-13 01:00:07,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +26: [2023-05-13 01:00:07,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:07,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +16: [2023-05-13 01:00:07,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:07,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +24: [2023-05-13 01:00:07,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +24: [2023-05-13 01:00:07,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +24: [2023-05-13 01:00:07,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +24: [2023-05-13 01:00:07,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +25: [2023-05-13 01:00:07,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +25: [2023-05-13 01:00:07,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +25: [2023-05-13 01:00:07,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +25: [2023-05-13 01:00:07,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +25: [2023-05-13 01:00:07,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +25: [2023-05-13 01:00:07,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +25: [2023-05-13 01:00:07,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +25: [2023-05-13 01:00:07,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +24: [2023-05-13 01:00:07,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +30: [2023-05-13 01:00:07,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +17: [2023-05-13 01:00:07,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +16: [2023-05-13 01:00:07,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +25: [2023-05-13 01:00:07,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +25: [2023-05-13 01:00:07,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +24: [2023-05-13 01:00:07,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:07,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:07,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +24: [2023-05-13 01:00:07,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +25: [2023-05-13 01:00:07,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +24: [2023-05-13 01:00:07,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +25: [2023-05-13 01:00:07,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +25: [2023-05-13 01:00:07,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +25: [2023-05-13 01:00:07,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +17: [2023-05-13 01:00:07,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +25: [2023-05-13 01:00:07,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +25: [2023-05-13 01:00:07,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +31: [2023-05-13 01:00:07,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +13: [2023-05-13 01:00:07,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +31: [2023-05-13 01:00:07,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +31: [2023-05-13 01:00:07,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +23: [2023-05-13 01:00:07,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +23: [2023-05-13 01:00:07,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +23: [2023-05-13 01:00:07,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +31: [2023-05-13 01:00:07,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +31: [2023-05-13 01:00:07,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +26: [2023-05-13 01:00:07,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +26: [2023-05-13 01:00:07,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +26: [2023-05-13 01:00:07,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +31: [2023-05-13 01:00:07,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +31: [2023-05-13 01:00:07,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +17: [2023-05-13 01:00:07,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +31: [2023-05-13 01:00:07,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +23: [2023-05-13 01:00:07,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +23: [2023-05-13 01:00:07,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +23: [2023-05-13 01:00:07,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +23: [2023-05-13 01:00:07,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +17: [2023-05-13 01:00:07,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +17: [2023-05-13 01:00:07,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +17: [2023-05-13 01:00:07,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +17: [2023-05-13 01:00:07,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +17: [2023-05-13 01:00:07,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +23: [2023-05-13 01:00:07,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +16: [2023-05-13 01:00:07,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +16: [2023-05-13 01:00:07,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +16: [2023-05-13 01:00:07,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +26: [2023-05-13 01:00:07,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +26: [2023-05-13 01:00:07,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +16: [2023-05-13 01:00:07,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +13: [2023-05-13 01:00:07,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +13: [2023-05-13 01:00:07,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +30: [2023-05-13 01:00:07,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +16: [2023-05-13 01:00:07,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +30: [2023-05-13 01:00:07,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +16: [2023-05-13 01:00:07,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +30: [2023-05-13 01:00:07,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +18: [2023-05-13 01:00:07,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +18: [2023-05-13 01:00:07,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +18: [2023-05-13 01:00:07,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +18: [2023-05-13 01:00:07,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +18: [2023-05-13 01:00:07,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +18: [2023-05-13 01:00:07,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +18: [2023-05-13 01:00:07,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +18: [2023-05-13 01:00:07,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +18: [2023-05-13 01:00:07,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +18: [2023-05-13 01:00:07,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +30: [2023-05-13 01:00:07,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +18: [2023-05-13 01:00:07,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +13: [2023-05-13 01:00:07,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +18: [2023-05-13 01:00:07,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +23: [2023-05-13 01:00:07,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +18: [2023-05-13 01:00:07,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +18: [2023-05-13 01:00:07,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +18: [2023-05-13 01:00:07,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +18: [2023-05-13 01:00:07,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +24: [2023-05-13 01:00:07,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +13: [2023-05-13 01:00:07,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +13: [2023-05-13 01:00:07,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +13: [2023-05-13 01:00:07,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +23: [2023-05-13 01:00:07,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +23: [2023-05-13 01:00:07,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +25: [2023-05-13 01:00:07,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +25: [2023-05-13 01:00:07,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +23: [2023-05-13 01:00:07,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +24: [2023-05-13 01:00:07,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +16: [2023-05-13 01:00:07,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 1: [2023-05-13 01:00:07,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +23: [2023-05-13 01:00:07,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +23: [2023-05-13 01:00:07,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +30: [2023-05-13 01:00:07,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:07,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +16: [2023-05-13 01:00:07,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:07,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +28: [2023-05-13 01:00:07,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +28: [2023-05-13 01:00:07,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +28: [2023-05-13 01:00:07,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +28: [2023-05-13 01:00:07,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +28: [2023-05-13 01:00:07,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +28: [2023-05-13 01:00:07,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +28: [2023-05-13 01:00:07,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +16: [2023-05-13 01:00:07,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 1: [2023-05-13 01:00:07,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +25: [2023-05-13 01:00:07,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +28: [2023-05-13 01:00:07,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +28: [2023-05-13 01:00:07,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +28: [2023-05-13 01:00:07,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +28: [2023-05-13 01:00:07,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +28: [2023-05-13 01:00:07,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +28: [2023-05-13 01:00:07,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +28: [2023-05-13 01:00:07,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +28: [2023-05-13 01:00:07,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +24: [2023-05-13 01:00:07,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +17: [2023-05-13 01:00:07,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +17: [2023-05-13 01:00:07,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +17: [2023-05-13 01:00:07,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +17: [2023-05-13 01:00:07,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +17: [2023-05-13 01:00:07,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +17: [2023-05-13 01:00:07,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:07,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +24: [2023-05-13 01:00:07,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +25: [2023-05-13 01:00:07,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +25: [2023-05-13 01:00:07,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:07,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +18: [2023-05-13 01:00:07,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +25: [2023-05-13 01:00:07,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +25: [2023-05-13 01:00:07,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +25: [2023-05-13 01:00:07,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +25: [2023-05-13 01:00:07,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +25: [2023-05-13 01:00:07,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +24: [2023-05-13 01:00:07,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +24: [2023-05-13 01:00:07,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 0: [2023-05-13 01:00:07,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:07,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +25: [2023-05-13 01:00:07,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +18: [2023-05-13 01:00:07,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +18: [2023-05-13 01:00:07,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt... +15: [2023-05-13 01:00:07,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +15: [2023-05-13 01:00:07,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +15: [2023-05-13 01:00:07,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +15: [2023-05-13 01:00:07,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +15: [2023-05-13 01:00:07,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +15: [2023-05-13 01:00:07,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +15: [2023-05-13 01:00:07,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +15: [2023-05-13 01:00:07,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +24: [2023-05-13 01:00:07,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +18: [2023-05-13 01:00:07,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +18: [2023-05-13 01:00:07,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +24: [2023-05-13 01:00:07,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +15: [2023-05-13 01:00:07,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +15: [2023-05-13 01:00:07,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +24: [2023-05-13 01:00:07,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +15: [2023-05-13 01:00:07,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +15: [2023-05-13 01:00:07,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +15: [2023-05-13 01:00:07,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +15: [2023-05-13 01:00:07,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +18: [2023-05-13 01:00:07,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +15: [2023-05-13 01:00:07,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +15: [2023-05-13 01:00:07,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +18: [2023-05-13 01:00:07,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +18: [2023-05-13 01:00:07,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +24: [2023-05-13 01:00:07,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +25: [2023-05-13 01:00:07,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +18: [2023-05-13 01:00:07,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 0: [2023-05-13 01:00:07,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:07,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +25: [2023-05-13 01:00:07,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:07,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +25: [2023-05-13 01:00:07,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +25: [2023-05-13 01:00:07,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +25: [2023-05-13 01:00:07,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +27: [2023-05-13 01:00:07,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +27: [2023-05-13 01:00:07,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +27: [2023-05-13 01:00:07,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +27: [2023-05-13 01:00:07,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +27: [2023-05-13 01:00:07,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +27: [2023-05-13 01:00:07,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +27: [2023-05-13 01:00:07,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +18: [2023-05-13 01:00:07,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +28: [2023-05-13 01:00:07,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +27: [2023-05-13 01:00:07,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +18: [2023-05-13 01:00:07,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. +27: [2023-05-13 01:00:07,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +27: [2023-05-13 01:00:07,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +27: [2023-05-13 01:00:07,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +27: [2023-05-13 01:00:07,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +22: [2023-05-13 01:00:07,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +22: [2023-05-13 01:00:07,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +22: [2023-05-13 01:00:07,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +22: [2023-05-13 01:00:07,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +22: [2023-05-13 01:00:07,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +22: [2023-05-13 01:00:07,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +27: [2023-05-13 01:00:07,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +27: [2023-05-13 01:00:07,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +27: [2023-05-13 01:00:07,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +27: [2023-05-13 01:00:07,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +18: [2023-05-13 01:00:07,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +28: [2023-05-13 01:00:07,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +18: [2023-05-13 01:00:07,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +28: [2023-05-13 01:00:07,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +28: [2023-05-13 01:00:07,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +28: [2023-05-13 01:00:07,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +28: [2023-05-13 01:00:07,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +22: [2023-05-13 01:00:07,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +18: [2023-05-13 01:00:07,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +28: [2023-05-13 01:00:07,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +28: [2023-05-13 01:00:07,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +18: [2023-05-13 01:00:07,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +28: [2023-05-13 01:00:07,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +15: [2023-05-13 01:00:07,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +18: [2023-05-13 01:00:07,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_10-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +28: [2023-05-13 01:00:07,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +28: [2023-05-13 01:00:07,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +28: [2023-05-13 01:00:07,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +15: [2023-05-13 01:00:07,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +15: [2023-05-13 01:00:07,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +15: [2023-05-13 01:00:07,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +28: [2023-05-13 01:00:07,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +28: [2023-05-13 01:00:07,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +28: [2023-05-13 01:00:07,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +28: [2023-05-13 01:00:07,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:07,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +29: [2023-05-13 01:00:07,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +29: [2023-05-13 01:00:07,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +29: [2023-05-13 01:00:07,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +29: [2023-05-13 01:00:07,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +29: [2023-05-13 01:00:07,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +29: [2023-05-13 01:00:07,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +29: [2023-05-13 01:00:07,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +27: [2023-05-13 01:00:07,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +29: [2023-05-13 01:00:07,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +15: [2023-05-13 01:00:07,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +29: [2023-05-13 01:00:07,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +15: [2023-05-13 01:00:07,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +29: [2023-05-13 01:00:07,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +15: [2023-05-13 01:00:07,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +29: [2023-05-13 01:00:07,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +27: [2023-05-13 01:00:07,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +27: [2023-05-13 01:00:07,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +29: [2023-05-13 01:00:07,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +29: [2023-05-13 01:00:07,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +15: [2023-05-13 01:00:07,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:07,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +29: [2023-05-13 01:00:07,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +19: [2023-05-13 01:00:07,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +19: [2023-05-13 01:00:07,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +19: [2023-05-13 01:00:07,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +19: [2023-05-13 01:00:07,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +19: [2023-05-13 01:00:07,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +19: [2023-05-13 01:00:07,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +19: [2023-05-13 01:00:07,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +19: [2023-05-13 01:00:07,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +19: [2023-05-13 01:00:07,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +22: [2023-05-13 01:00:07,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +22: [2023-05-13 01:00:07,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +22: [2023-05-13 01:00:07,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +27: [2023-05-13 01:00:07,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +19: [2023-05-13 01:00:07,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +19: [2023-05-13 01:00:07,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +19: [2023-05-13 01:00:07,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +15: [2023-05-13 01:00:07,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +15: [2023-05-13 01:00:07,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +19: [2023-05-13 01:00:07,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +19: [2023-05-13 01:00:07,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +19: [2023-05-13 01:00:07,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +19: [2023-05-13 01:00:07,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +15: [2023-05-13 01:00:07,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +22: [2023-05-13 01:00:07,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +27: [2023-05-13 01:00:07,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +27: [2023-05-13 01:00:07,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +27: [2023-05-13 01:00:07,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +15: [2023-05-13 01:00:07,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +27: [2023-05-13 01:00:07,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +27: [2023-05-13 01:00:07,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +22: [2023-05-13 01:00:07,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +22: [2023-05-13 01:00:07,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +22: [2023-05-13 01:00:07,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +22: [2023-05-13 01:00:07,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +27: [2023-05-13 01:00:07,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +27: [2023-05-13 01:00:07,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +15: [2023-05-13 01:00:07,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +15: [2023-05-13 01:00:07,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +15: [2023-05-13 01:00:07,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +22: [2023-05-13 01:00:07,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 2: [2023-05-13 01:00:07,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 2: [2023-05-13 01:00:07,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +27: [2023-05-13 01:00:07,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +22: [2023-05-13 01:00:07,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +22: [2023-05-13 01:00:07,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +15: [2023-05-13 01:00:07,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +22: [2023-05-13 01:00:07,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +27: [2023-05-13 01:00:07,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +27: [2023-05-13 01:00:07,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +27: [2023-05-13 01:00:07,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +27: [2023-05-13 01:00:07,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +22: [2023-05-13 01:00:07,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:07,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +22: [2023-05-13 01:00:07,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +22: [2023-05-13 01:00:07,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +22: [2023-05-13 01:00:07,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 5: [2023-05-13 01:00:07,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +11: [2023-05-13 01:00:07,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +11: [2023-05-13 01:00:07,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +11: [2023-05-13 01:00:07,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +11: [2023-05-13 01:00:07,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +11: [2023-05-13 01:00:07,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +11: [2023-05-13 01:00:07,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +11: [2023-05-13 01:00:07,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +11: [2023-05-13 01:00:07,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +19: [2023-05-13 01:00:07,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:07,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 5: [2023-05-13 01:00:07,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +11: [2023-05-13 01:00:07,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +11: [2023-05-13 01:00:07,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +11: [2023-05-13 01:00:07,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +29: [2023-05-13 01:00:07,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +29: [2023-05-13 01:00:07,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +29: [2023-05-13 01:00:07,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +11: [2023-05-13 01:00:07,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +11: [2023-05-13 01:00:07,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +11: [2023-05-13 01:00:07,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +11: [2023-05-13 01:00:07,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +11: [2023-05-13 01:00:07,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:07,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +29: [2023-05-13 01:00:07,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +29: [2023-05-13 01:00:07,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:07,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:07,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:07,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 4: [2023-05-13 01:00:07,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:07,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:07,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +19: [2023-05-13 01:00:07,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +29: [2023-05-13 01:00:07,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +19: [2023-05-13 01:00:07,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +19: [2023-05-13 01:00:07,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +19: [2023-05-13 01:00:07,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 4: [2023-05-13 01:00:07,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:07,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:07,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:07,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:07,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +19: [2023-05-13 01:00:07,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +19: [2023-05-13 01:00:07,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +11: [2023-05-13 01:00:07,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +11: [2023-05-13 01:00:07,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +11: [2023-05-13 01:00:07,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +11: [2023-05-13 01:00:07,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +19: [2023-05-13 01:00:07,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +19: [2023-05-13 01:00:07,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +19: [2023-05-13 01:00:07,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +19: [2023-05-13 01:00:07,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +11: [2023-05-13 01:00:07,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +11: [2023-05-13 01:00:07,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +11: [2023-05-13 01:00:07,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +19: [2023-05-13 01:00:07,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +11: [2023-05-13 01:00:07,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +11: [2023-05-13 01:00:07,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +19: [2023-05-13 01:00:07,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +11: [2023-05-13 01:00:07,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +19: [2023-05-13 01:00:07,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +11: [2023-05-13 01:00:07,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +21: [2023-05-13 01:00:07,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +21: [2023-05-13 01:00:07,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +10: [2023-05-13 01:00:07,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +10: [2023-05-13 01:00:07,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +10: [2023-05-13 01:00:07,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +10: [2023-05-13 01:00:07,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +10: [2023-05-13 01:00:07,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +10: [2023-05-13 01:00:07,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +10: [2023-05-13 01:00:07,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +21: [2023-05-13 01:00:07,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +10: [2023-05-13 01:00:07,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +10: [2023-05-13 01:00:07,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +11: [2023-05-13 01:00:07,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +21: [2023-05-13 01:00:07,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +21: [2023-05-13 01:00:07,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +21: [2023-05-13 01:00:07,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +21: [2023-05-13 01:00:07,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +21: [2023-05-13 01:00:07,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +21: [2023-05-13 01:00:07,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +10: [2023-05-13 01:00:07,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 6: [2023-05-13 01:00:07,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +21: [2023-05-13 01:00:07,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +10: [2023-05-13 01:00:07,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +10: [2023-05-13 01:00:07,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +10: [2023-05-13 01:00:07,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +10: [2023-05-13 01:00:07,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +21: [2023-05-13 01:00:07,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +21: [2023-05-13 01:00:07,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +11: [2023-05-13 01:00:07,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +10: [2023-05-13 01:00:07,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +21: [2023-05-13 01:00:07,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +21: [2023-05-13 01:00:07,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +21: [2023-05-13 01:00:07,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +21: [2023-05-13 01:00:07,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +10: [2023-05-13 01:00:07,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +20: [2023-05-13 01:00:07,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +20: [2023-05-13 01:00:07,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +20: [2023-05-13 01:00:07,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +20: [2023-05-13 01:00:07,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +11: [2023-05-13 01:00:07,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +20: [2023-05-13 01:00:07,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +20: [2023-05-13 01:00:07,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +14: [2023-05-13 01:00:07,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +14: [2023-05-13 01:00:07,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +20: [2023-05-13 01:00:07,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +20: [2023-05-13 01:00:07,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +20: [2023-05-13 01:00:07,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +14: [2023-05-13 01:00:07,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +14: [2023-05-13 01:00:07,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +14: [2023-05-13 01:00:07,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +14: [2023-05-13 01:00:07,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +14: [2023-05-13 01:00:07,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 8: [2023-05-13 01:00:07,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +14: [2023-05-13 01:00:07,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +11: [2023-05-13 01:00:07,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +20: [2023-05-13 01:00:07,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +23: [2023-05-13 01:00:07,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +23: [2023-05-13 01:00:07,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +23: [2023-05-13 01:00:07,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +14: [2023-05-13 01:00:07,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +14: [2023-05-13 01:00:07,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +23: [2023-05-13 01:00:07,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +23: [2023-05-13 01:00:07,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +23: [2023-05-13 01:00:07,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +23: [2023-05-13 01:00:07,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +23: [2023-05-13 01:00:07,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +20: [2023-05-13 01:00:07,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +14: [2023-05-13 01:00:07,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +14: [2023-05-13 01:00:07,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +20: [2023-05-13 01:00:07,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +23: [2023-05-13 01:00:07,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +23: [2023-05-13 01:00:07,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +14: [2023-05-13 01:00:07,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +20: [2023-05-13 01:00:07,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +14: [2023-05-13 01:00:07,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +23: [2023-05-13 01:00:07,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +14: [2023-05-13 01:00:07,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +20: [2023-05-13 01:00:07,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +14: [2023-05-13 01:00:07,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +20: [2023-05-13 01:00:07,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +20: [2023-05-13 01:00:07,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +23: [2023-05-13 01:00:07,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +23: [2023-05-13 01:00:07,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +11: [2023-05-13 01:00:07,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +23: [2023-05-13 01:00:07,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +23: [2023-05-13 01:00:07,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +23: [2023-05-13 01:00:07,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +12: [2023-05-13 01:00:07,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +12: [2023-05-13 01:00:07,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +12: [2023-05-13 01:00:07,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +12: [2023-05-13 01:00:07,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +12: [2023-05-13 01:00:07,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +12: [2023-05-13 01:00:07,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +12: [2023-05-13 01:00:07,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +12: [2023-05-13 01:00:07,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 7: [2023-05-13 01:00:07,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +12: [2023-05-13 01:00:07,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +17: [2023-05-13 01:00:07,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +17: [2023-05-13 01:00:07,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +17: [2023-05-13 01:00:07,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +17: [2023-05-13 01:00:07,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +17: [2023-05-13 01:00:07,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +17: [2023-05-13 01:00:07,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +17: [2023-05-13 01:00:07,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +17: [2023-05-13 01:00:07,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +12: [2023-05-13 01:00:07,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +12: [2023-05-13 01:00:07,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +12: [2023-05-13 01:00:07,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +12: [2023-05-13 01:00:07,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +17: [2023-05-13 01:00:07,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +12: [2023-05-13 01:00:07,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +12: [2023-05-13 01:00:07,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +12: [2023-05-13 01:00:07,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 7: [2023-05-13 01:00:07,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +17: [2023-05-13 01:00:07,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +31: [2023-05-13 01:00:07,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +31: [2023-05-13 01:00:07,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +31: [2023-05-13 01:00:07,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +31: [2023-05-13 01:00:07,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +31: [2023-05-13 01:00:07,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +31: [2023-05-13 01:00:07,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +31: [2023-05-13 01:00:07,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +31: [2023-05-13 01:00:07,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +13: [2023-05-13 01:00:07,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +13: [2023-05-13 01:00:07,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +31: [2023-05-13 01:00:07,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +13: [2023-05-13 01:00:07,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +30: [2023-05-13 01:00:07,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +17: [2023-05-13 01:00:07,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +30: [2023-05-13 01:00:07,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +17: [2023-05-13 01:00:07,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +13: [2023-05-13 01:00:07,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +13: [2023-05-13 01:00:07,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +13: [2023-05-13 01:00:07,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +13: [2023-05-13 01:00:07,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +17: [2023-05-13 01:00:07,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +13: [2023-05-13 01:00:07,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +17: [2023-05-13 01:00:07,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +31: [2023-05-13 01:00:07,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +17: [2023-05-13 01:00:07,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +30: [2023-05-13 01:00:07,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +30: [2023-05-13 01:00:07,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +30: [2023-05-13 01:00:07,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +21: [2023-05-13 01:00:07,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +30: [2023-05-13 01:00:07,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +30: [2023-05-13 01:00:07,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +30: [2023-05-13 01:00:07,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +30: [2023-05-13 01:00:07,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +13: [2023-05-13 01:00:07,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +13: [2023-05-13 01:00:07,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +31: [2023-05-13 01:00:07,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +31: [2023-05-13 01:00:07,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +30: [2023-05-13 01:00:07,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +13: [2023-05-13 01:00:07,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +31: [2023-05-13 01:00:07,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +31: [2023-05-13 01:00:07,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +31: [2023-05-13 01:00:07,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +31: [2023-05-13 01:00:07,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +21: [2023-05-13 01:00:07,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +30: [2023-05-13 01:00:07,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +13: [2023-05-13 01:00:07,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +13: [2023-05-13 01:00:07,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +13: [2023-05-13 01:00:07,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +17: [2023-05-13 01:00:07,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +13: [2023-05-13 01:00:07,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +13: [2023-05-13 01:00:07,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:07,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:07,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:07,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +21: [2023-05-13 01:00:07,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +10: [2023-05-13 01:00:07,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +20: [2023-05-13 01:00:07,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +16: [2023-05-13 01:00:07,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +16: [2023-05-13 01:00:07,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +16: [2023-05-13 01:00:07,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +16: [2023-05-13 01:00:07,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +16: [2023-05-13 01:00:07,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +16: [2023-05-13 01:00:07,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +16: [2023-05-13 01:00:07,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +16: [2023-05-13 01:00:07,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +16: [2023-05-13 01:00:07,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +21: [2023-05-13 01:00:07,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +16: [2023-05-13 01:00:07,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 9: [2023-05-13 01:00:07,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 9: [2023-05-13 01:00:07,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 3: [2023-05-13 01:00:07,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 8: [2023-05-13 01:00:07,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +10: [2023-05-13 01:00:07,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +23: [2023-05-13 01:00:07,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +23: [2023-05-13 01:00:07,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +16: [2023-05-13 01:00:07,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +21: [2023-05-13 01:00:07,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +16: [2023-05-13 01:00:07,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +16: [2023-05-13 01:00:07,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +16: [2023-05-13 01:00:07,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 3: [2023-05-13 01:00:07,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +16: [2023-05-13 01:00:07,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +16: [2023-05-13 01:00:07,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +21: [2023-05-13 01:00:07,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +21: [2023-05-13 01:00:07,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +21: [2023-05-13 01:00:07,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +17: [2023-05-13 01:00:07,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +21: [2023-05-13 01:00:08,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +14: [2023-05-13 01:00:08,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +14: [2023-05-13 01:00:08,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +14: [2023-05-13 01:00:08,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +14: [2023-05-13 01:00:08,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +14: [2023-05-13 01:00:08,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +21: [2023-05-13 01:00:08,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +10: [2023-05-13 01:00:08,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +14: [2023-05-13 01:00:08,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +10: [2023-05-13 01:00:08,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +10: [2023-05-13 01:00:08,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +26: [2023-05-13 01:00:08,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +26: [2023-05-13 01:00:08,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +26: [2023-05-13 01:00:08,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +12: [2023-05-13 01:00:08,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +26: [2023-05-13 01:00:08,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +26: [2023-05-13 01:00:08,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +26: [2023-05-13 01:00:08,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +26: [2023-05-13 01:00:08,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +26: [2023-05-13 01:00:08,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +10: [2023-05-13 01:00:08,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +20: [2023-05-13 01:00:08,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +14: [2023-05-13 01:00:08,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +26: [2023-05-13 01:00:08,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +26: [2023-05-13 01:00:08,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +26: [2023-05-13 01:00:08,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +23: [2023-05-13 01:00:08,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +20: [2023-05-13 01:00:08,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +26: [2023-05-13 01:00:08,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +26: [2023-05-13 01:00:08,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +26: [2023-05-13 01:00:08,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +21: [2023-05-13 01:00:08,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +26: [2023-05-13 01:00:08,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +26: [2023-05-13 01:00:08,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +31: [2023-05-13 01:00:08,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +10: [2023-05-13 01:00:08,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +14: [2023-05-13 01:00:08,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +23: [2023-05-13 01:00:08,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +17: [2023-05-13 01:00:08,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +23: [2023-05-13 01:00:08,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +21: [2023-05-13 01:00:08,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +30: [2023-05-13 01:00:08,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +10: [2023-05-13 01:00:08,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +10: [2023-05-13 01:00:08,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +13: [2023-05-13 01:00:08,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +13: [2023-05-13 01:00:08,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +13: [2023-05-13 01:00:08,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +10: [2023-05-13 01:00:08,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +17: [2023-05-13 01:00:08,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +31: [2023-05-13 01:00:08,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +21: [2023-05-13 01:00:08,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +20: [2023-05-13 01:00:08,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +20: [2023-05-13 01:00:08,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +24: [2023-05-13 01:00:08,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +24: [2023-05-13 01:00:08,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +24: [2023-05-13 01:00:08,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +24: [2023-05-13 01:00:08,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +12: [2023-05-13 01:00:08,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:08,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +24: [2023-05-13 01:00:08,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +24: [2023-05-13 01:00:08,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +21: [2023-05-13 01:00:08,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +21: [2023-05-13 01:00:08,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +31: [2023-05-13 01:00:08,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +14: [2023-05-13 01:00:08,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +20: [2023-05-13 01:00:08,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +23: [2023-05-13 01:00:08,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +23: [2023-05-13 01:00:08,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +23: [2023-05-13 01:00:08,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +23: [2023-05-13 01:00:08,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +31: [2023-05-13 01:00:08,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +31: [2023-05-13 01:00:08,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +21: [2023-05-13 01:00:08,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +12: [2023-05-13 01:00:08,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +12: [2023-05-13 01:00:08,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +24: [2023-05-13 01:00:08,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +24: [2023-05-13 01:00:08,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +10: [2023-05-13 01:00:08,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +24: [2023-05-13 01:00:08,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:08,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +10: [2023-05-13 01:00:08,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +20: [2023-05-13 01:00:08,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +20: [2023-05-13 01:00:08,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +10: [2023-05-13 01:00:08,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +31: [2023-05-13 01:00:08,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +30: [2023-05-13 01:00:08,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +14: [2023-05-13 01:00:08,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +14: [2023-05-13 01:00:08,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +31: [2023-05-13 01:00:08,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +16: [2023-05-13 01:00:08,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +23: [2023-05-13 01:00:08,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +25: [2023-05-13 01:00:08,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +25: [2023-05-13 01:00:08,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +25: [2023-05-13 01:00:08,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +23: [2023-05-13 01:00:08,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:08,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +31: [2023-05-13 01:00:08,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +31: [2023-05-13 01:00:08,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +24: [2023-05-13 01:00:08,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +25: [2023-05-13 01:00:08,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +25: [2023-05-13 01:00:08,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +25: [2023-05-13 01:00:08,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +25: [2023-05-13 01:00:08,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +17: [2023-05-13 01:00:08,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +25: [2023-05-13 01:00:08,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +20: [2023-05-13 01:00:08,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +14: [2023-05-13 01:00:08,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +14: [2023-05-13 01:00:08,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +14: [2023-05-13 01:00:08,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +25: [2023-05-13 01:00:08,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +25: [2023-05-13 01:00:08,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +14: [2023-05-13 01:00:08,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +13: [2023-05-13 01:00:08,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +13: [2023-05-13 01:00:08,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +30: [2023-05-13 01:00:08,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +10: [2023-05-13 01:00:08,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +13: [2023-05-13 01:00:08,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +13: [2023-05-13 01:00:08,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +13: [2023-05-13 01:00:08,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +30: [2023-05-13 01:00:08,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +25: [2023-05-13 01:00:08,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +17: [2023-05-13 01:00:08,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +25: [2023-05-13 01:00:08,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +25: [2023-05-13 01:00:08,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +25: [2023-05-13 01:00:08,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +25: [2023-05-13 01:00:08,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +14: [2023-05-13 01:00:08,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +25: [2023-05-13 01:00:08,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +18: [2023-05-13 01:00:08,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +18: [2023-05-13 01:00:08,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +13: [2023-05-13 01:00:08,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +13: [2023-05-13 01:00:08,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +17: [2023-05-13 01:00:08,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +17: [2023-05-13 01:00:08,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +17: [2023-05-13 01:00:08,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +17: [2023-05-13 01:00:08,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +18: [2023-05-13 01:00:08,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +18: [2023-05-13 01:00:08,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +18: [2023-05-13 01:00:08,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +18: [2023-05-13 01:00:08,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +18: [2023-05-13 01:00:08,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +13: [2023-05-13 01:00:08,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +18: [2023-05-13 01:00:08,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +10: [2023-05-13 01:00:08,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +26: [2023-05-13 01:00:08,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +12: [2023-05-13 01:00:08,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +12: [2023-05-13 01:00:08,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +12: [2023-05-13 01:00:08,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +10: [2023-05-13 01:00:08,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +18: [2023-05-13 01:00:08,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +18: [2023-05-13 01:00:08,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +30: [2023-05-13 01:00:08,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +30: [2023-05-13 01:00:08,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +30: [2023-05-13 01:00:08,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +16: [2023-05-13 01:00:08,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +12: [2023-05-13 01:00:08,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +18: [2023-05-13 01:00:08,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +18: [2023-05-13 01:00:08,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +18: [2023-05-13 01:00:08,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +18: [2023-05-13 01:00:08,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +20: [2023-05-13 01:00:08,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +18: [2023-05-13 01:00:08,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt... +12: [2023-05-13 01:00:08,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +31: [2023-05-13 01:00:08,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +31: [2023-05-13 01:00:08,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +23: [2023-05-13 01:00:08,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +31: [2023-05-13 01:00:08,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +12: [2023-05-13 01:00:08,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +31: [2023-05-13 01:00:08,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +12: [2023-05-13 01:00:08,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +16: [2023-05-13 01:00:08,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +20: [2023-05-13 01:00:08,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +31: [2023-05-13 01:00:08,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +23: [2023-05-13 01:00:08,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +31: [2023-05-13 01:00:08,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +23: [2023-05-13 01:00:08,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +30: [2023-05-13 01:00:08,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +20: [2023-05-13 01:00:08,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +20: [2023-05-13 01:00:08,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +23: [2023-05-13 01:00:08,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +26: [2023-05-13 01:00:08,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +31: [2023-05-13 01:00:08,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +17: [2023-05-13 01:00:08,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +20: [2023-05-13 01:00:08,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +13: [2023-05-13 01:00:08,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +23: [2023-05-13 01:00:08,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +20: [2023-05-13 01:00:08,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +13: [2023-05-13 01:00:08,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +13: [2023-05-13 01:00:08,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +13: [2023-05-13 01:00:08,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +13: [2023-05-13 01:00:08,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +30: [2023-05-13 01:00:08,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +16: [2023-05-13 01:00:08,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +26: [2023-05-13 01:00:08,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +28: [2023-05-13 01:00:08,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +28: [2023-05-13 01:00:08,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +28: [2023-05-13 01:00:08,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +28: [2023-05-13 01:00:08,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +28: [2023-05-13 01:00:08,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +28: [2023-05-13 01:00:08,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +28: [2023-05-13 01:00:08,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +28: [2023-05-13 01:00:08,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +30: [2023-05-13 01:00:08,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +17: [2023-05-13 01:00:08,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +28: [2023-05-13 01:00:08,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +17: [2023-05-13 01:00:08,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +17: [2023-05-13 01:00:08,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +26: [2023-05-13 01:00:08,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +30: [2023-05-13 01:00:08,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +20: [2023-05-13 01:00:08,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:08,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +28: [2023-05-13 01:00:08,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +16: [2023-05-13 01:00:08,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +16: [2023-05-13 01:00:08,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +16: [2023-05-13 01:00:08,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +16: [2023-05-13 01:00:08,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +30: [2023-05-13 01:00:08,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +28: [2023-05-13 01:00:08,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +28: [2023-05-13 01:00:08,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +28: [2023-05-13 01:00:08,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +16: [2023-05-13 01:00:08,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +28: [2023-05-13 01:00:08,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +28: [2023-05-13 01:00:08,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +28: [2023-05-13 01:00:08,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +17: [2023-05-13 01:00:08,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +12: [2023-05-13 01:00:08,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +17: [2023-05-13 01:00:08,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +12: [2023-05-13 01:00:08,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +12: [2023-05-13 01:00:08,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +16: [2023-05-13 01:00:08,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +25: [2023-05-13 01:00:08,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +25: [2023-05-13 01:00:08,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +12: [2023-05-13 01:00:08,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +12: [2023-05-13 01:00:08,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +26: [2023-05-13 01:00:08,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +26: [2023-05-13 01:00:08,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +26: [2023-05-13 01:00:08,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +26: [2023-05-13 01:00:08,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +26: [2023-05-13 01:00:08,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +26: [2023-05-13 01:00:08,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +30: [2023-05-13 01:00:08,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +24: [2023-05-13 01:00:08,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +24: [2023-05-13 01:00:08,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +25: [2023-05-13 01:00:08,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +16: [2023-05-13 01:00:08,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +24: [2023-05-13 01:00:08,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +25: [2023-05-13 01:00:08,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +18: [2023-05-13 01:00:08,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +18: [2023-05-13 01:00:08,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +17: [2023-05-13 01:00:08,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +25: [2023-05-13 01:00:08,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +27: [2023-05-13 01:00:08,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +27: [2023-05-13 01:00:08,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +27: [2023-05-13 01:00:08,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +27: [2023-05-13 01:00:08,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +27: [2023-05-13 01:00:08,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +27: [2023-05-13 01:00:08,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +27: [2023-05-13 01:00:08,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +27: [2023-05-13 01:00:08,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +24: [2023-05-13 01:00:08,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +26: [2023-05-13 01:00:08,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +24: [2023-05-13 01:00:08,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:08,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +24: [2023-05-13 01:00:08,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +24: [2023-05-13 01:00:08,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +27: [2023-05-13 01:00:08,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +27: [2023-05-13 01:00:08,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +16: [2023-05-13 01:00:08,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +27: [2023-05-13 01:00:08,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +27: [2023-05-13 01:00:08,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +27: [2023-05-13 01:00:08,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +27: [2023-05-13 01:00:08,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +27: [2023-05-13 01:00:08,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +18: [2023-05-13 01:00:08,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +18: [2023-05-13 01:00:08,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +16: [2023-05-13 01:00:08,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +27: [2023-05-13 01:00:08,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +16: [2023-05-13 01:00:08,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +18: [2023-05-13 01:00:08,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +18: [2023-05-13 01:00:08,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. +18: [2023-05-13 01:00:08,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_11-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +16: [2023-05-13 01:00:08,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +16: [2023-05-13 01:00:08,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +25: [2023-05-13 01:00:08,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +25: [2023-05-13 01:00:08,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +25: [2023-05-13 01:00:08,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +25: [2023-05-13 01:00:08,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +15: [2023-05-13 01:00:08,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +15: [2023-05-13 01:00:08,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +15: [2023-05-13 01:00:08,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +15: [2023-05-13 01:00:08,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +15: [2023-05-13 01:00:08,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +15: [2023-05-13 01:00:08,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +26: [2023-05-13 01:00:08,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +15: [2023-05-13 01:00:08,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +15: [2023-05-13 01:00:08,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +26: [2023-05-13 01:00:08,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +26: [2023-05-13 01:00:08,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +15: [2023-05-13 01:00:08,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:08,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +26: [2023-05-13 01:00:08,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +26: [2023-05-13 01:00:08,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +28: [2023-05-13 01:00:08,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +15: [2023-05-13 01:00:08,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +15: [2023-05-13 01:00:08,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +15: [2023-05-13 01:00:08,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +15: [2023-05-13 01:00:08,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +22: [2023-05-13 01:00:08,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +22: [2023-05-13 01:00:08,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +22: [2023-05-13 01:00:08,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +22: [2023-05-13 01:00:08,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +15: [2023-05-13 01:00:08,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +22: [2023-05-13 01:00:08,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +22: [2023-05-13 01:00:08,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +22: [2023-05-13 01:00:08,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +22: [2023-05-13 01:00:08,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +15: [2023-05-13 01:00:08,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +15: [2023-05-13 01:00:08,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +22: [2023-05-13 01:00:08,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +22: [2023-05-13 01:00:08,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +18: [2023-05-13 01:00:08,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +22: [2023-05-13 01:00:08,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +18: [2023-05-13 01:00:08,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +18: [2023-05-13 01:00:08,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +22: [2023-05-13 01:00:08,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +22: [2023-05-13 01:00:08,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +22: [2023-05-13 01:00:08,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +22: [2023-05-13 01:00:08,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +22: [2023-05-13 01:00:08,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +28: [2023-05-13 01:00:08,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:08,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +18: [2023-05-13 01:00:08,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +18: [2023-05-13 01:00:08,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:08,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:08,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +28: [2023-05-13 01:00:08,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +28: [2023-05-13 01:00:08,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +28: [2023-05-13 01:00:08,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +18: [2023-05-13 01:00:08,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +28: [2023-05-13 01:00:08,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +28: [2023-05-13 01:00:08,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +18: [2023-05-13 01:00:08,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +18: [2023-05-13 01:00:08,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +28: [2023-05-13 01:00:08,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +28: [2023-05-13 01:00:08,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +28: [2023-05-13 01:00:08,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +27: [2023-05-13 01:00:08,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +28: [2023-05-13 01:00:08,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +27: [2023-05-13 01:00:08,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +27: [2023-05-13 01:00:08,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +28: [2023-05-13 01:00:08,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +28: [2023-05-13 01:00:08,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +27: [2023-05-13 01:00:08,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +27: [2023-05-13 01:00:08,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +27: [2023-05-13 01:00:08,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +27: [2023-05-13 01:00:08,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +22: [2023-05-13 01:00:08,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +28: [2023-05-13 01:00:08,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +15: [2023-05-13 01:00:08,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +27: [2023-05-13 01:00:08,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +28: [2023-05-13 01:00:08,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +25: [2023-05-13 01:00:08,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +25: [2023-05-13 01:00:08,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +25: [2023-05-13 01:00:08,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +25: [2023-05-13 01:00:08,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +25: [2023-05-13 01:00:08,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +25: [2023-05-13 01:00:08,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +25: [2023-05-13 01:00:08,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +28: [2023-05-13 01:00:08,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +22: [2023-05-13 01:00:08,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +15: [2023-05-13 01:00:08,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +27: [2023-05-13 01:00:08,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +22: [2023-05-13 01:00:08,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +29: [2023-05-13 01:00:08,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +29: [2023-05-13 01:00:08,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +29: [2023-05-13 01:00:08,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +29: [2023-05-13 01:00:08,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +29: [2023-05-13 01:00:08,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +29: [2023-05-13 01:00:08,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +29: [2023-05-13 01:00:08,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +29: [2023-05-13 01:00:08,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +22: [2023-05-13 01:00:08,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +27: [2023-05-13 01:00:08,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +22: [2023-05-13 01:00:08,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +22: [2023-05-13 01:00:08,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +15: [2023-05-13 01:00:08,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +27: [2023-05-13 01:00:08,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +27: [2023-05-13 01:00:08,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +27: [2023-05-13 01:00:08,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +15: [2023-05-13 01:00:08,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +29: [2023-05-13 01:00:08,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:08,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:08,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:08,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:08,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:08,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:08,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:08,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +27: [2023-05-13 01:00:08,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +27: [2023-05-13 01:00:08,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +15: [2023-05-13 01:00:08,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +15: [2023-05-13 01:00:08,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +27: [2023-05-13 01:00:08,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +15: [2023-05-13 01:00:08,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +15: [2023-05-13 01:00:08,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +15: [2023-05-13 01:00:08,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +22: [2023-05-13 01:00:08,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +15: [2023-05-13 01:00:08,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +22: [2023-05-13 01:00:08,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +22: [2023-05-13 01:00:08,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +22: [2023-05-13 01:00:08,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +22: [2023-05-13 01:00:08,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +22: [2023-05-13 01:00:08,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +15: [2023-05-13 01:00:08,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +22: [2023-05-13 01:00:08,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +15: [2023-05-13 01:00:08,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +15: [2023-05-13 01:00:08,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +15: [2023-05-13 01:00:08,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +11: [2023-05-13 01:00:08,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +11: [2023-05-13 01:00:08,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +11: [2023-05-13 01:00:08,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +11: [2023-05-13 01:00:08,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +11: [2023-05-13 01:00:08,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +11: [2023-05-13 01:00:08,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +11: [2023-05-13 01:00:08,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +11: [2023-05-13 01:00:08,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +15: [2023-05-13 01:00:08,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +15: [2023-05-13 01:00:08,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +22: [2023-05-13 01:00:08,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +22: [2023-05-13 01:00:08,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +11: [2023-05-13 01:00:08,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +22: [2023-05-13 01:00:08,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +11: [2023-05-13 01:00:08,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +11: [2023-05-13 01:00:08,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +11: [2023-05-13 01:00:08,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +11: [2023-05-13 01:00:08,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +11: [2023-05-13 01:00:08,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +11: [2023-05-13 01:00:08,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +11: [2023-05-13 01:00:08,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +29: [2023-05-13 01:00:08,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +29: [2023-05-13 01:00:08,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +29: [2023-05-13 01:00:08,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +29: [2023-05-13 01:00:08,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:08,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +29: [2023-05-13 01:00:08,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +29: [2023-05-13 01:00:08,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +29: [2023-05-13 01:00:08,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +29: [2023-05-13 01:00:08,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +29: [2023-05-13 01:00:08,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +29: [2023-05-13 01:00:08,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +29: [2023-05-13 01:00:08,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +11: [2023-05-13 01:00:08,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +11: [2023-05-13 01:00:08,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +29: [2023-05-13 01:00:08,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +11: [2023-05-13 01:00:08,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +29: [2023-05-13 01:00:08,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +29: [2023-05-13 01:00:08,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +29: [2023-05-13 01:00:08,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +11: [2023-05-13 01:00:08,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +11: [2023-05-13 01:00:08,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:08,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:08,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:08,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:08,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:08,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:08,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:08,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:08,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:08,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +19: [2023-05-13 01:00:08,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +23: [2023-05-13 01:00:08,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +23: [2023-05-13 01:00:08,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:08,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +19: [2023-05-13 01:00:08,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +19: [2023-05-13 01:00:08,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +19: [2023-05-13 01:00:08,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +23: [2023-05-13 01:00:08,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:08,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +19: [2023-05-13 01:00:08,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +11: [2023-05-13 01:00:08,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +11: [2023-05-13 01:00:08,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +23: [2023-05-13 01:00:08,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +23: [2023-05-13 01:00:08,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +23: [2023-05-13 01:00:08,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +23: [2023-05-13 01:00:08,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +23: [2023-05-13 01:00:08,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +23: [2023-05-13 01:00:08,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +23: [2023-05-13 01:00:08,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +11: [2023-05-13 01:00:08,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +11: [2023-05-13 01:00:08,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +23: [2023-05-13 01:00:08,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +23: [2023-05-13 01:00:08,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +23: [2023-05-13 01:00:08,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +23: [2023-05-13 01:00:08,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +23: [2023-05-13 01:00:08,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +23: [2023-05-13 01:00:08,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +11: [2023-05-13 01:00:08,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +11: [2023-05-13 01:00:08,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +14: [2023-05-13 01:00:08,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +14: [2023-05-13 01:00:08,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +14: [2023-05-13 01:00:08,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +14: [2023-05-13 01:00:08,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +14: [2023-05-13 01:00:08,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +14: [2023-05-13 01:00:08,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +14: [2023-05-13 01:00:08,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +14: [2023-05-13 01:00:08,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +11: [2023-05-13 01:00:08,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +14: [2023-05-13 01:00:08,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +14: [2023-05-13 01:00:08,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +11: [2023-05-13 01:00:08,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +14: [2023-05-13 01:00:08,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +14: [2023-05-13 01:00:08,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +14: [2023-05-13 01:00:08,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +14: [2023-05-13 01:00:08,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +14: [2023-05-13 01:00:08,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +14: [2023-05-13 01:00:08,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +11: [2023-05-13 01:00:08,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +11: [2023-05-13 01:00:08,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:08,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +19: [2023-05-13 01:00:08,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:08,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:08,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +24: [2023-05-13 01:00:08,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:08,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:08,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:08,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +11: [2023-05-13 01:00:08,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +23: [2023-05-13 01:00:08,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +23: [2023-05-13 01:00:08,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:08,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +14: [2023-05-13 01:00:08,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +23: [2023-05-13 01:00:08,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:08,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:08,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:08,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +23: [2023-05-13 01:00:08,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +23: [2023-05-13 01:00:08,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +14: [2023-05-13 01:00:08,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +14: [2023-05-13 01:00:08,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +14: [2023-05-13 01:00:08,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +19: [2023-05-13 01:00:08,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:08,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:08,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:08,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +14: [2023-05-13 01:00:08,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +14: [2023-05-13 01:00:08,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +14: [2023-05-13 01:00:08,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +14: [2023-05-13 01:00:08,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +23: [2023-05-13 01:00:08,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +23: [2023-05-13 01:00:08,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +23: [2023-05-13 01:00:08,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +23: [2023-05-13 01:00:08,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +23: [2023-05-13 01:00:08,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +14: [2023-05-13 01:00:08,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +10: [2023-05-13 01:00:08,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +10: [2023-05-13 01:00:08,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +10: [2023-05-13 01:00:08,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +10: [2023-05-13 01:00:08,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +10: [2023-05-13 01:00:08,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +10: [2023-05-13 01:00:08,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +10: [2023-05-13 01:00:08,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +23: [2023-05-13 01:00:08,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +10: [2023-05-13 01:00:08,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +10: [2023-05-13 01:00:08,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +10: [2023-05-13 01:00:08,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +10: [2023-05-13 01:00:08,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +10: [2023-05-13 01:00:08,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +10: [2023-05-13 01:00:08,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +10: [2023-05-13 01:00:08,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +19: [2023-05-13 01:00:08,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +20: [2023-05-13 01:00:08,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +10: [2023-05-13 01:00:08,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +20: [2023-05-13 01:00:08,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +12: [2023-05-13 01:00:08,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +12: [2023-05-13 01:00:08,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +19: [2023-05-13 01:00:08,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +19: [2023-05-13 01:00:08,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +20: [2023-05-13 01:00:08,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +20: [2023-05-13 01:00:08,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +20: [2023-05-13 01:00:08,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +20: [2023-05-13 01:00:08,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +20: [2023-05-13 01:00:08,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +20: [2023-05-13 01:00:08,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +12: [2023-05-13 01:00:08,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +12: [2023-05-13 01:00:08,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +12: [2023-05-13 01:00:08,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +12: [2023-05-13 01:00:08,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +12: [2023-05-13 01:00:08,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +12: [2023-05-13 01:00:08,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +20: [2023-05-13 01:00:08,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +12: [2023-05-13 01:00:08,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +10: [2023-05-13 01:00:08,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +20: [2023-05-13 01:00:08,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +17: [2023-05-13 01:00:08,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +17: [2023-05-13 01:00:08,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +24: [2023-05-13 01:00:08,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +17: [2023-05-13 01:00:08,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +20: [2023-05-13 01:00:08,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +14: [2023-05-13 01:00:08,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +19: [2023-05-13 01:00:08,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +12: [2023-05-13 01:00:08,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +12: [2023-05-13 01:00:08,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +17: [2023-05-13 01:00:08,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +17: [2023-05-13 01:00:08,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +17: [2023-05-13 01:00:08,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +17: [2023-05-13 01:00:08,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +14: [2023-05-13 01:00:08,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +24: [2023-05-13 01:00:08,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +17: [2023-05-13 01:00:08,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +20: [2023-05-13 01:00:08,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:08,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +24: [2023-05-13 01:00:08,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +17: [2023-05-13 01:00:08,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +17: [2023-05-13 01:00:08,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +14: [2023-05-13 01:00:08,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +12: [2023-05-13 01:00:08,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +12: [2023-05-13 01:00:08,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +14: [2023-05-13 01:00:08,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +12: [2023-05-13 01:00:08,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +12: [2023-05-13 01:00:08,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +19: [2023-05-13 01:00:08,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +14: [2023-05-13 01:00:08,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +12: [2023-05-13 01:00:08,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +20: [2023-05-13 01:00:08,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +20: [2023-05-13 01:00:08,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +19: [2023-05-13 01:00:08,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +14: [2023-05-13 01:00:08,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +14: [2023-05-13 01:00:08,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +20: [2023-05-13 01:00:08,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +20: [2023-05-13 01:00:08,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +19: [2023-05-13 01:00:08,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +17: [2023-05-13 01:00:08,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +23: [2023-05-13 01:00:08,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +23: [2023-05-13 01:00:08,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +17: [2023-05-13 01:00:08,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +17: [2023-05-13 01:00:08,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +17: [2023-05-13 01:00:08,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +17: [2023-05-13 01:00:08,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +17: [2023-05-13 01:00:08,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +16: [2023-05-13 01:00:08,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +16: [2023-05-13 01:00:08,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +23: [2023-05-13 01:00:08,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +23: [2023-05-13 01:00:08,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +23: [2023-05-13 01:00:08,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +16: [2023-05-13 01:00:08,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +24: [2023-05-13 01:00:08,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +16: [2023-05-13 01:00:08,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +16: [2023-05-13 01:00:08,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +16: [2023-05-13 01:00:08,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +16: [2023-05-13 01:00:08,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +16: [2023-05-13 01:00:08,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +16: [2023-05-13 01:00:08,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +16: [2023-05-13 01:00:08,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +13: [2023-05-13 01:00:08,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +13: [2023-05-13 01:00:08,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +13: [2023-05-13 01:00:08,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +13: [2023-05-13 01:00:08,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +13: [2023-05-13 01:00:08,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +13: [2023-05-13 01:00:08,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +13: [2023-05-13 01:00:08,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +30: [2023-05-13 01:00:08,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +13: [2023-05-13 01:00:08,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +13: [2023-05-13 01:00:08,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +30: [2023-05-13 01:00:08,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +13: [2023-05-13 01:00:08,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +30: [2023-05-13 01:00:08,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +16: [2023-05-13 01:00:08,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +16: [2023-05-13 01:00:08,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +30: [2023-05-13 01:00:08,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +30: [2023-05-13 01:00:08,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +30: [2023-05-13 01:00:08,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +30: [2023-05-13 01:00:08,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +30: [2023-05-13 01:00:08,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +16: [2023-05-13 01:00:08,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +16: [2023-05-13 01:00:08,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +16: [2023-05-13 01:00:08,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +13: [2023-05-13 01:00:08,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +13: [2023-05-13 01:00:08,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +16: [2023-05-13 01:00:08,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +13: [2023-05-13 01:00:08,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +13: [2023-05-13 01:00:08,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +30: [2023-05-13 01:00:08,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +30: [2023-05-13 01:00:08,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +24: [2023-05-13 01:00:08,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +24: [2023-05-13 01:00:08,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:08,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +30: [2023-05-13 01:00:08,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:08,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +18: [2023-05-13 01:00:08,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:08,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +18: [2023-05-13 01:00:08,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +18: [2023-05-13 01:00:08,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +18: [2023-05-13 01:00:08,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +18: [2023-05-13 01:00:08,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +24: [2023-05-13 01:00:08,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +18: [2023-05-13 01:00:08,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +18: [2023-05-13 01:00:08,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +20: [2023-05-13 01:00:08,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +18: [2023-05-13 01:00:08,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +18: [2023-05-13 01:00:08,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +18: [2023-05-13 01:00:08,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt... +12: [2023-05-13 01:00:08,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +10: [2023-05-13 01:00:08,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +10: [2023-05-13 01:00:08,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +10: [2023-05-13 01:00:08,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +10: [2023-05-13 01:00:08,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +17: [2023-05-13 01:00:08,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +17: [2023-05-13 01:00:08,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +10: [2023-05-13 01:00:08,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +10: [2023-05-13 01:00:08,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +10: [2023-05-13 01:00:08,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +16: [2023-05-13 01:00:08,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +10: [2023-05-13 01:00:08,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +30: [2023-05-13 01:00:08,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +20: [2023-05-13 01:00:08,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +12: [2023-05-13 01:00:08,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +12: [2023-05-13 01:00:08,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +12: [2023-05-13 01:00:08,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +20: [2023-05-13 01:00:08,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +16: [2023-05-13 01:00:08,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +10: [2023-05-13 01:00:08,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +17: [2023-05-13 01:00:08,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +30: [2023-05-13 01:00:08,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +17: [2023-05-13 01:00:08,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +10: [2023-05-13 01:00:08,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:08,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +17: [2023-05-13 01:00:08,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +10: [2023-05-13 01:00:08,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +10: [2023-05-13 01:00:08,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +31: [2023-05-13 01:00:08,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +21: [2023-05-13 01:00:08,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +21: [2023-05-13 01:00:08,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +13: [2023-05-13 01:00:08,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +13: [2023-05-13 01:00:08,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +31: [2023-05-13 01:00:08,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +31: [2023-05-13 01:00:08,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +10: [2023-05-13 01:00:08,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +31: [2023-05-13 01:00:08,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +31: [2023-05-13 01:00:08,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +10: [2023-05-13 01:00:08,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:08,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +31: [2023-05-13 01:00:08,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +31: [2023-05-13 01:00:08,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +31: [2023-05-13 01:00:08,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +21: [2023-05-13 01:00:08,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +10: [2023-05-13 01:00:08,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +16: [2023-05-13 01:00:08,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +20: [2023-05-13 01:00:08,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +20: [2023-05-13 01:00:08,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +20: [2023-05-13 01:00:08,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +21: [2023-05-13 01:00:08,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +17: [2023-05-13 01:00:08,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +17: [2023-05-13 01:00:08,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +17: [2023-05-13 01:00:08,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +17: [2023-05-13 01:00:08,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +31: [2023-05-13 01:00:08,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +31: [2023-05-13 01:00:08,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +12: [2023-05-13 01:00:08,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +12: [2023-05-13 01:00:08,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +12: [2023-05-13 01:00:08,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +12: [2023-05-13 01:00:08,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +30: [2023-05-13 01:00:08,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +31: [2023-05-13 01:00:08,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +31: [2023-05-13 01:00:08,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +31: [2023-05-13 01:00:08,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +31: [2023-05-13 01:00:08,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +10: [2023-05-13 01:00:08,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +13: [2023-05-13 01:00:08,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +13: [2023-05-13 01:00:08,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +20: [2023-05-13 01:00:08,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +13: [2023-05-13 01:00:08,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +13: [2023-05-13 01:00:08,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +30: [2023-05-13 01:00:08,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +13: [2023-05-13 01:00:08,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +17: [2023-05-13 01:00:08,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +20: [2023-05-13 01:00:08,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +20: [2023-05-13 01:00:08,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +18: [2023-05-13 01:00:08,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +18: [2023-05-13 01:00:08,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +12: [2023-05-13 01:00:08,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +16: [2023-05-13 01:00:08,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +30: [2023-05-13 01:00:08,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +17: [2023-05-13 01:00:08,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +20: [2023-05-13 01:00:08,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +12: [2023-05-13 01:00:08,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +12: [2023-05-13 01:00:08,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +16: [2023-05-13 01:00:08,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +16: [2023-05-13 01:00:08,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +16: [2023-05-13 01:00:08,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +13: [2023-05-13 01:00:08,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +20: [2023-05-13 01:00:08,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +20: [2023-05-13 01:00:08,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +18: [2023-05-13 01:00:08,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +20: [2023-05-13 01:00:08,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +13: [2023-05-13 01:00:08,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +12: [2023-05-13 01:00:08,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +13: [2023-05-13 01:00:08,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +12: [2023-05-13 01:00:08,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +17: [2023-05-13 01:00:08,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +17: [2023-05-13 01:00:08,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +17: [2023-05-13 01:00:08,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +12: [2023-05-13 01:00:08,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +13: [2023-05-13 01:00:08,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +13: [2023-05-13 01:00:08,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:08,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +18: [2023-05-13 01:00:08,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. +13: [2023-05-13 01:00:08,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +12: [2023-05-13 01:00:08,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +20: [2023-05-13 01:00:08,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +12: [2023-05-13 01:00:08,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +20: [2023-05-13 01:00:08,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +17: [2023-05-13 01:00:08,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +17: [2023-05-13 01:00:08,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +20: [2023-05-13 01:00:08,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:08,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_12-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +31: [2023-05-13 01:00:08,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +21: [2023-05-13 01:00:08,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +21: [2023-05-13 01:00:08,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +31: [2023-05-13 01:00:08,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +31: [2023-05-13 01:00:08,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +30: [2023-05-13 01:00:08,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +31: [2023-05-13 01:00:08,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +31: [2023-05-13 01:00:08,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +21: [2023-05-13 01:00:08,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +31: [2023-05-13 01:00:08,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +31: [2023-05-13 01:00:08,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +18: [2023-05-13 01:00:08,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +21: [2023-05-13 01:00:08,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +16: [2023-05-13 01:00:08,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +16: [2023-05-13 01:00:08,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +16: [2023-05-13 01:00:08,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +16: [2023-05-13 01:00:08,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +16: [2023-05-13 01:00:08,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +16: [2023-05-13 01:00:08,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +16: [2023-05-13 01:00:08,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +16: [2023-05-13 01:00:08,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +16: [2023-05-13 01:00:08,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:08,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:08,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:08,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:08,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:08,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:08,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:08,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:08,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +27: [2023-05-13 01:00:08,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +27: [2023-05-13 01:00:08,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +27: [2023-05-13 01:00:08,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +27: [2023-05-13 01:00:08,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +27: [2023-05-13 01:00:08,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +27: [2023-05-13 01:00:08,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +27: [2023-05-13 01:00:08,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +27: [2023-05-13 01:00:08,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +27: [2023-05-13 01:00:08,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +27: [2023-05-13 01:00:08,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +27: [2023-05-13 01:00:08,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +27: [2023-05-13 01:00:08,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +27: [2023-05-13 01:00:08,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +27: [2023-05-13 01:00:08,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +27: [2023-05-13 01:00:08,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +27: [2023-05-13 01:00:08,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +22: [2023-05-13 01:00:08,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +22: [2023-05-13 01:00:08,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +22: [2023-05-13 01:00:08,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +22: [2023-05-13 01:00:08,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +22: [2023-05-13 01:00:08,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +22: [2023-05-13 01:00:08,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +22: [2023-05-13 01:00:08,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +22: [2023-05-13 01:00:08,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +22: [2023-05-13 01:00:08,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +22: [2023-05-13 01:00:08,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +22: [2023-05-13 01:00:08,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +22: [2023-05-13 01:00:08,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +22: [2023-05-13 01:00:08,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +22: [2023-05-13 01:00:08,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +22: [2023-05-13 01:00:08,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +26: [2023-05-13 01:00:08,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +26: [2023-05-13 01:00:08,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +26: [2023-05-13 01:00:08,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +26: [2023-05-13 01:00:08,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +26: [2023-05-13 01:00:08,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +26: [2023-05-13 01:00:08,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +26: [2023-05-13 01:00:08,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +26: [2023-05-13 01:00:08,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +26: [2023-05-13 01:00:08,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +22: [2023-05-13 01:00:08,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +26: [2023-05-13 01:00:08,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +26: [2023-05-13 01:00:08,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +26: [2023-05-13 01:00:08,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +26: [2023-05-13 01:00:08,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +26: [2023-05-13 01:00:08,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +26: [2023-05-13 01:00:08,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +26: [2023-05-13 01:00:08,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +25: [2023-05-13 01:00:08,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +25: [2023-05-13 01:00:08,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +11: [2023-05-13 01:00:08,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +11: [2023-05-13 01:00:08,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +28: [2023-05-13 01:00:08,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +28: [2023-05-13 01:00:08,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +28: [2023-05-13 01:00:08,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +28: [2023-05-13 01:00:08,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +28: [2023-05-13 01:00:08,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +28: [2023-05-13 01:00:08,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +28: [2023-05-13 01:00:08,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +11: [2023-05-13 01:00:08,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +11: [2023-05-13 01:00:08,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +11: [2023-05-13 01:00:08,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +11: [2023-05-13 01:00:08,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +25: [2023-05-13 01:00:08,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +28: [2023-05-13 01:00:08,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +25: [2023-05-13 01:00:08,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +11: [2023-05-13 01:00:08,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +25: [2023-05-13 01:00:08,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +11: [2023-05-13 01:00:08,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +25: [2023-05-13 01:00:08,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +25: [2023-05-13 01:00:08,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +25: [2023-05-13 01:00:08,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +25: [2023-05-13 01:00:08,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +28: [2023-05-13 01:00:08,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +25: [2023-05-13 01:00:08,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +11: [2023-05-13 01:00:08,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +28: [2023-05-13 01:00:08,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +11: [2023-05-13 01:00:08,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +28: [2023-05-13 01:00:08,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +11: [2023-05-13 01:00:08,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +28: [2023-05-13 01:00:08,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +11: [2023-05-13 01:00:08,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +27: [2023-05-13 01:00:08,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +28: [2023-05-13 01:00:08,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +28: [2023-05-13 01:00:08,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +25: [2023-05-13 01:00:08,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +11: [2023-05-13 01:00:08,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +28: [2023-05-13 01:00:08,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +11: [2023-05-13 01:00:08,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +28: [2023-05-13 01:00:08,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +11: [2023-05-13 01:00:08,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +11: [2023-05-13 01:00:08,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +25: [2023-05-13 01:00:08,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +25: [2023-05-13 01:00:08,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +25: [2023-05-13 01:00:08,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +25: [2023-05-13 01:00:08,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +25: [2023-05-13 01:00:08,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +22: [2023-05-13 01:00:08,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +27: [2023-05-13 01:00:08,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +27: [2023-05-13 01:00:08,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +27: [2023-05-13 01:00:08,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +27: [2023-05-13 01:00:08,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +27: [2023-05-13 01:00:08,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +27: [2023-05-13 01:00:08,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +27: [2023-05-13 01:00:08,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +26: [2023-05-13 01:00:08,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +22: [2023-05-13 01:00:08,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +22: [2023-05-13 01:00:08,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +22: [2023-05-13 01:00:08,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +26: [2023-05-13 01:00:08,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +27: [2023-05-13 01:00:08,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:08,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +14: [2023-05-13 01:00:08,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +14: [2023-05-13 01:00:08,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +14: [2023-05-13 01:00:08,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +14: [2023-05-13 01:00:08,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +14: [2023-05-13 01:00:08,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +14: [2023-05-13 01:00:08,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +14: [2023-05-13 01:00:08,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +22: [2023-05-13 01:00:08,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +14: [2023-05-13 01:00:08,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +14: [2023-05-13 01:00:08,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +14: [2023-05-13 01:00:08,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +14: [2023-05-13 01:00:08,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +14: [2023-05-13 01:00:08,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +14: [2023-05-13 01:00:08,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +14: [2023-05-13 01:00:08,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +14: [2023-05-13 01:00:08,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +22: [2023-05-13 01:00:08,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +22: [2023-05-13 01:00:08,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +27: [2023-05-13 01:00:08,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +27: [2023-05-13 01:00:08,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +27: [2023-05-13 01:00:08,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +29: [2023-05-13 01:00:08,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +29: [2023-05-13 01:00:08,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +29: [2023-05-13 01:00:08,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +29: [2023-05-13 01:00:08,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +29: [2023-05-13 01:00:08,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +29: [2023-05-13 01:00:08,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +27: [2023-05-13 01:00:08,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +27: [2023-05-13 01:00:08,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +29: [2023-05-13 01:00:08,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +26: [2023-05-13 01:00:08,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +29: [2023-05-13 01:00:08,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +25: [2023-05-13 01:00:08,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +27: [2023-05-13 01:00:08,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +29: [2023-05-13 01:00:08,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +29: [2023-05-13 01:00:08,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +29: [2023-05-13 01:00:08,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +15: [2023-05-13 01:00:08,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +15: [2023-05-13 01:00:08,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +28: [2023-05-13 01:00:08,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +29: [2023-05-13 01:00:08,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +15: [2023-05-13 01:00:08,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +15: [2023-05-13 01:00:08,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +15: [2023-05-13 01:00:08,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +15: [2023-05-13 01:00:08,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +15: [2023-05-13 01:00:08,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +27: [2023-05-13 01:00:08,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +15: [2023-05-13 01:00:08,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +29: [2023-05-13 01:00:08,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +29: [2023-05-13 01:00:08,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +29: [2023-05-13 01:00:08,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +29: [2023-05-13 01:00:08,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +22: [2023-05-13 01:00:08,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +22: [2023-05-13 01:00:08,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +28: [2023-05-13 01:00:08,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +22: [2023-05-13 01:00:08,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +25: [2023-05-13 01:00:08,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +11: [2023-05-13 01:00:08,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +15: [2023-05-13 01:00:08,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +15: [2023-05-13 01:00:08,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +15: [2023-05-13 01:00:08,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +15: [2023-05-13 01:00:08,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +15: [2023-05-13 01:00:08,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +11: [2023-05-13 01:00:08,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +11: [2023-05-13 01:00:08,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +26: [2023-05-13 01:00:08,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +15: [2023-05-13 01:00:08,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +15: [2023-05-13 01:00:08,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +15: [2023-05-13 01:00:08,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +26: [2023-05-13 01:00:08,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +22: [2023-05-13 01:00:08,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +26: [2023-05-13 01:00:08,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +26: [2023-05-13 01:00:08,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +26: [2023-05-13 01:00:08,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +26: [2023-05-13 01:00:08,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +11: [2023-05-13 01:00:08,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +28: [2023-05-13 01:00:08,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +28: [2023-05-13 01:00:08,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +11: [2023-05-13 01:00:08,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +28: [2023-05-13 01:00:08,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +28: [2023-05-13 01:00:08,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +28: [2023-05-13 01:00:08,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +22: [2023-05-13 01:00:08,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +22: [2023-05-13 01:00:08,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +25: [2023-05-13 01:00:08,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +22: [2023-05-13 01:00:08,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +25: [2023-05-13 01:00:08,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:08,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +11: [2023-05-13 01:00:08,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:08,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +28: [2023-05-13 01:00:08,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +25: [2023-05-13 01:00:08,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +28: [2023-05-13 01:00:08,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +22: [2023-05-13 01:00:08,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +28: [2023-05-13 01:00:08,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +11: [2023-05-13 01:00:08,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +25: [2023-05-13 01:00:08,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +25: [2023-05-13 01:00:08,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +25: [2023-05-13 01:00:08,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +25: [2023-05-13 01:00:08,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +11: [2023-05-13 01:00:08,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +11: [2023-05-13 01:00:08,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +11: [2023-05-13 01:00:08,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:08,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +22: [2023-05-13 01:00:08,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +11: [2023-05-13 01:00:08,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +11: [2023-05-13 01:00:08,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +25: [2023-05-13 01:00:08,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +26: [2023-05-13 01:00:08,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +26: [2023-05-13 01:00:08,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +28: [2023-05-13 01:00:08,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +28: [2023-05-13 01:00:08,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +11: [2023-05-13 01:00:08,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +19: [2023-05-13 01:00:08,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +19: [2023-05-13 01:00:08,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +19: [2023-05-13 01:00:08,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +19: [2023-05-13 01:00:08,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +19: [2023-05-13 01:00:08,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +19: [2023-05-13 01:00:08,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +19: [2023-05-13 01:00:08,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +26: [2023-05-13 01:00:08,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +26: [2023-05-13 01:00:08,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +28: [2023-05-13 01:00:08,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +14: [2023-05-13 01:00:08,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +14: [2023-05-13 01:00:08,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +28: [2023-05-13 01:00:08,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +28: [2023-05-13 01:00:08,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:08,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +14: [2023-05-13 01:00:08,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +19: [2023-05-13 01:00:08,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 0: [2023-05-13 01:00:08,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +19: [2023-05-13 01:00:08,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +11: [2023-05-13 01:00:08,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +19: [2023-05-13 01:00:08,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +28: [2023-05-13 01:00:08,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +19: [2023-05-13 01:00:08,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +19: [2023-05-13 01:00:08,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +14: [2023-05-13 01:00:08,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +14: [2023-05-13 01:00:08,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +29: [2023-05-13 01:00:08,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +29: [2023-05-13 01:00:08,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +19: [2023-05-13 01:00:08,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +19: [2023-05-13 01:00:08,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +19: [2023-05-13 01:00:08,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +19: [2023-05-13 01:00:08,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +14: [2023-05-13 01:00:08,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +26: [2023-05-13 01:00:08,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +25: [2023-05-13 01:00:08,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +29: [2023-05-13 01:00:08,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +25: [2023-05-13 01:00:08,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +15: [2023-05-13 01:00:08,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +15: [2023-05-13 01:00:08,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +15: [2023-05-13 01:00:08,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 0: [2023-05-13 01:00:08,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +25: [2023-05-13 01:00:08,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +29: [2023-05-13 01:00:08,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +25: [2023-05-13 01:00:08,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +29: [2023-05-13 01:00:08,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +29: [2023-05-13 01:00:08,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +25: [2023-05-13 01:00:08,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +14: [2023-05-13 01:00:08,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +11: [2023-05-13 01:00:08,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +11: [2023-05-13 01:00:08,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:08,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:08,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +15: [2023-05-13 01:00:08,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +15: [2023-05-13 01:00:08,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +15: [2023-05-13 01:00:08,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +15: [2023-05-13 01:00:08,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +14: [2023-05-13 01:00:08,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +29: [2023-05-13 01:00:08,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 4: [2023-05-13 01:00:08,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +14: [2023-05-13 01:00:08,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +25: [2023-05-13 01:00:08,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +29: [2023-05-13 01:00:08,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +14: [2023-05-13 01:00:08,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +14: [2023-05-13 01:00:08,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +15: [2023-05-13 01:00:08,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +29: [2023-05-13 01:00:08,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +29: [2023-05-13 01:00:08,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +15: [2023-05-13 01:00:08,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +29: [2023-05-13 01:00:08,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +15: [2023-05-13 01:00:08,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +15: [2023-05-13 01:00:08,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:08,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +19: [2023-05-13 01:00:08,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +29: [2023-05-13 01:00:08,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +29: [2023-05-13 01:00:08,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +29: [2023-05-13 01:00:08,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +15: [2023-05-13 01:00:08,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:08,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +15: [2023-05-13 01:00:08,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 2: [2023-05-13 01:00:08,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +29: [2023-05-13 01:00:08,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +15: [2023-05-13 01:00:08,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +15: [2023-05-13 01:00:08,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:08,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +18: [2023-05-13 01:00:08,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +29: [2023-05-13 01:00:08,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:08,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +18: [2023-05-13 01:00:08,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +18: [2023-05-13 01:00:08,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +18: [2023-05-13 01:00:08,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +18: [2023-05-13 01:00:08,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:08,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:08,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +18: [2023-05-13 01:00:08,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +15: [2023-05-13 01:00:08,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:08,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 2: [2023-05-13 01:00:08,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:08,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +18: [2023-05-13 01:00:08,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +19: [2023-05-13 01:00:08,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +19: [2023-05-13 01:00:08,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +12: [2023-05-13 01:00:08,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +12: [2023-05-13 01:00:08,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +12: [2023-05-13 01:00:08,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +12: [2023-05-13 01:00:08,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +12: [2023-05-13 01:00:08,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +12: [2023-05-13 01:00:08,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +12: [2023-05-13 01:00:08,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +12: [2023-05-13 01:00:08,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +12: [2023-05-13 01:00:08,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +19: [2023-05-13 01:00:08,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +19: [2023-05-13 01:00:08,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +12: [2023-05-13 01:00:08,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +12: [2023-05-13 01:00:08,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +12: [2023-05-13 01:00:08,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +19: [2023-05-13 01:00:08,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +12: [2023-05-13 01:00:08,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +12: [2023-05-13 01:00:08,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +12: [2023-05-13 01:00:08,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +12: [2023-05-13 01:00:08,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +20: [2023-05-13 01:00:08,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +20: [2023-05-13 01:00:08,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +20: [2023-05-13 01:00:08,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +20: [2023-05-13 01:00:08,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +20: [2023-05-13 01:00:08,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +20: [2023-05-13 01:00:08,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +20: [2023-05-13 01:00:08,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +20: [2023-05-13 01:00:08,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +20: [2023-05-13 01:00:08,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +19: [2023-05-13 01:00:08,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +20: [2023-05-13 01:00:08,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +20: [2023-05-13 01:00:08,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +20: [2023-05-13 01:00:08,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +17: [2023-05-13 01:00:08,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +17: [2023-05-13 01:00:08,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +17: [2023-05-13 01:00:08,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +17: [2023-05-13 01:00:08,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +17: [2023-05-13 01:00:08,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +17: [2023-05-13 01:00:08,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +17: [2023-05-13 01:00:08,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +17: [2023-05-13 01:00:08,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +20: [2023-05-13 01:00:08,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +20: [2023-05-13 01:00:08,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +17: [2023-05-13 01:00:08,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +17: [2023-05-13 01:00:08,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +19: [2023-05-13 01:00:08,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +19: [2023-05-13 01:00:08,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +19: [2023-05-13 01:00:08,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +20: [2023-05-13 01:00:08,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +17: [2023-05-13 01:00:08,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +23: [2023-05-13 01:00:08,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +23: [2023-05-13 01:00:08,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +20: [2023-05-13 01:00:08,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +17: [2023-05-13 01:00:08,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +23: [2023-05-13 01:00:08,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +17: [2023-05-13 01:00:08,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +17: [2023-05-13 01:00:08,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +17: [2023-05-13 01:00:08,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +23: [2023-05-13 01:00:08,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +23: [2023-05-13 01:00:08,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +23: [2023-05-13 01:00:08,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +23: [2023-05-13 01:00:08,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +23: [2023-05-13 01:00:08,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +17: [2023-05-13 01:00:08,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +23: [2023-05-13 01:00:08,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +23: [2023-05-13 01:00:08,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +23: [2023-05-13 01:00:08,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 6: [2023-05-13 01:00:08,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +23: [2023-05-13 01:00:08,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +19: [2023-05-13 01:00:08,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +23: [2023-05-13 01:00:08,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +23: [2023-05-13 01:00:08,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +23: [2023-05-13 01:00:08,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +19: [2023-05-13 01:00:08,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +13: [2023-05-13 01:00:08,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +23: [2023-05-13 01:00:08,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +19: [2023-05-13 01:00:08,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +13: [2023-05-13 01:00:08,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +21: [2023-05-13 01:00:08,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +13: [2023-05-13 01:00:08,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +21: [2023-05-13 01:00:08,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +21: [2023-05-13 01:00:08,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +21: [2023-05-13 01:00:08,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +13: [2023-05-13 01:00:08,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +21: [2023-05-13 01:00:08,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +21: [2023-05-13 01:00:08,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +21: [2023-05-13 01:00:08,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +21: [2023-05-13 01:00:08,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +18: [2023-05-13 01:00:08,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +21: [2023-05-13 01:00:08,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:08,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:08,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:08,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +18: [2023-05-13 01:00:08,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:08,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +24: [2023-05-13 01:00:08,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +24: [2023-05-13 01:00:08,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +21: [2023-05-13 01:00:08,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +30: [2023-05-13 01:00:08,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +24: [2023-05-13 01:00:08,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +24: [2023-05-13 01:00:08,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +12: [2023-05-13 01:00:08,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +24: [2023-05-13 01:00:08,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +24: [2023-05-13 01:00:08,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +24: [2023-05-13 01:00:08,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +30: [2023-05-13 01:00:08,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +13: [2023-05-13 01:00:08,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +13: [2023-05-13 01:00:08,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +13: [2023-05-13 01:00:08,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +13: [2023-05-13 01:00:08,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +24: [2023-05-13 01:00:08,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +19: [2023-05-13 01:00:08,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +19: [2023-05-13 01:00:08,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +30: [2023-05-13 01:00:08,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +30: [2023-05-13 01:00:08,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +30: [2023-05-13 01:00:08,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +30: [2023-05-13 01:00:08,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +30: [2023-05-13 01:00:08,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +30: [2023-05-13 01:00:08,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +19: [2023-05-13 01:00:08,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +24: [2023-05-13 01:00:08,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +24: [2023-05-13 01:00:08,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +24: [2023-05-13 01:00:08,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +24: [2023-05-13 01:00:08,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +18: [2023-05-13 01:00:08,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +18: [2023-05-13 01:00:08,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +24: [2023-05-13 01:00:08,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +24: [2023-05-13 01:00:08,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +18: [2023-05-13 01:00:08,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +24: [2023-05-13 01:00:08,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +24: [2023-05-13 01:00:08,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +30: [2023-05-13 01:00:08,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... +30: [2023-05-13 01:00:08,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +30: [2023-05-13 01:00:08,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 8: [2023-05-13 01:00:08,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +30: [2023-05-13 01:00:08,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +17: [2023-05-13 01:00:08,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +31: [2023-05-13 01:00:08,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +31: [2023-05-13 01:00:08,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +31: [2023-05-13 01:00:08,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +31: [2023-05-13 01:00:08,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +31: [2023-05-13 01:00:08,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +31: [2023-05-13 01:00:08,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +31: [2023-05-13 01:00:08,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +31: [2023-05-13 01:00:08,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 8: [2023-05-13 01:00:08,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 6: [2023-05-13 01:00:08,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +18: [2023-05-13 01:00:08,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +20: [2023-05-13 01:00:08,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +10: [2023-05-13 01:00:08,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +10: [2023-05-13 01:00:08,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +10: [2023-05-13 01:00:08,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +10: [2023-05-13 01:00:08,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +10: [2023-05-13 01:00:08,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +10: [2023-05-13 01:00:08,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +10: [2023-05-13 01:00:08,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +10: [2023-05-13 01:00:08,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +31: [2023-05-13 01:00:08,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +10: [2023-05-13 01:00:08,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +12: [2023-05-13 01:00:08,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +10: [2023-05-13 01:00:08,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +10: [2023-05-13 01:00:08,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +10: [2023-05-13 01:00:08,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +10: [2023-05-13 01:00:08,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +10: [2023-05-13 01:00:08,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +10: [2023-05-13 01:00:08,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +10: [2023-05-13 01:00:08,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:08,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +12: [2023-05-13 01:00:08,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +12: [2023-05-13 01:00:08,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +17: [2023-05-13 01:00:08,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +12: [2023-05-13 01:00:08,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +23: [2023-05-13 01:00:08,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +18: [2023-05-13 01:00:08,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:08,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:08,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:08,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:08,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +17: [2023-05-13 01:00:08,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +20: [2023-05-13 01:00:08,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +20: [2023-05-13 01:00:08,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +20: [2023-05-13 01:00:08,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +20: [2023-05-13 01:00:08,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +17: [2023-05-13 01:00:08,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +23: [2023-05-13 01:00:08,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 3: [2023-05-13 01:00:08,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +13: [2023-05-13 01:00:08,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 3: [2023-05-13 01:00:08,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +23: [2023-05-13 01:00:08,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +12: [2023-05-13 01:00:08,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +12: [2023-05-13 01:00:08,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +12: [2023-05-13 01:00:08,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +12: [2023-05-13 01:00:08,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +30: [2023-05-13 01:00:08,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +30: [2023-05-13 01:00:08,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +23: [2023-05-13 01:00:08,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:08,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +12: [2023-05-13 01:00:08,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +12: [2023-05-13 01:00:08,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +24: [2023-05-13 01:00:08,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +17: [2023-05-13 01:00:08,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +17: [2023-05-13 01:00:08,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +17: [2023-05-13 01:00:08,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +17: [2023-05-13 01:00:08,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +17: [2023-05-13 01:00:08,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +21: [2023-05-13 01:00:08,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +21: [2023-05-13 01:00:08,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +17: [2023-05-13 01:00:08,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +12: [2023-05-13 01:00:08,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +13: [2023-05-13 01:00:08,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +23: [2023-05-13 01:00:08,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +23: [2023-05-13 01:00:08,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +23: [2023-05-13 01:00:08,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +23: [2023-05-13 01:00:08,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:08,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:08,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +21: [2023-05-13 01:00:08,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +24: [2023-05-13 01:00:08,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +30: [2023-05-13 01:00:08,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +20: [2023-05-13 01:00:08,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +13: [2023-05-13 01:00:08,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +23: [2023-05-13 01:00:08,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +13: [2023-05-13 01:00:08,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +20: [2023-05-13 01:00:08,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +20: [2023-05-13 01:00:08,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +20: [2023-05-13 01:00:08,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +20: [2023-05-13 01:00:08,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +30: [2023-05-13 01:00:08,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +30: [2023-05-13 01:00:08,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +24: [2023-05-13 01:00:08,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +24: [2023-05-13 01:00:08,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +31: [2023-05-13 01:00:08,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +20: [2023-05-13 01:00:08,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +20: [2023-05-13 01:00:08,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +31: [2023-05-13 01:00:08,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 9: [2023-05-13 01:00:08,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +31: [2023-05-13 01:00:08,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +31: [2023-05-13 01:00:08,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +23: [2023-05-13 01:00:08,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +24: [2023-05-13 01:00:08,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +31: [2023-05-13 01:00:08,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +31: [2023-05-13 01:00:08,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +12: [2023-05-13 01:00:08,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:08,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +12: [2023-05-13 01:00:08,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +17: [2023-05-13 01:00:08,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +12: [2023-05-13 01:00:08,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +24: [2023-05-13 01:00:08,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +24: [2023-05-13 01:00:08,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +12: [2023-05-13 01:00:08,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +30: [2023-05-13 01:00:08,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +30: [2023-05-13 01:00:08,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +30: [2023-05-13 01:00:08,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +21: [2023-05-13 01:00:08,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +10: [2023-05-13 01:00:08,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +10: [2023-05-13 01:00:08,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +10: [2023-05-13 01:00:08,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +10: [2023-05-13 01:00:08,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +13: [2023-05-13 01:00:08,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +13: [2023-05-13 01:00:08,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +10: [2023-05-13 01:00:08,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +30: [2023-05-13 01:00:08,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +30: [2023-05-13 01:00:08,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +13: [2023-05-13 01:00:08,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:08,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:08,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +30: [2023-05-13 01:00:08,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +10: [2023-05-13 01:00:08,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +24: [2023-05-13 01:00:08,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:08,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +17: [2023-05-13 01:00:08,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +17: [2023-05-13 01:00:08,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +17: [2023-05-13 01:00:08,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +23: [2023-05-13 01:00:08,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +13: [2023-05-13 01:00:08,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +13: [2023-05-13 01:00:08,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +23: [2023-05-13 01:00:08,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +17: [2023-05-13 01:00:08,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +17: [2023-05-13 01:00:08,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +23: [2023-05-13 01:00:08,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +24: [2023-05-13 01:00:08,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +20: [2023-05-13 01:00:08,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +20: [2023-05-13 01:00:08,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +24: [2023-05-13 01:00:08,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +10: [2023-05-13 01:00:08,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +24: [2023-05-13 01:00:08,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +23: [2023-05-13 01:00:08,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +24: [2023-05-13 01:00:08,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_13-model_00-model_states.pt. +21: [2023-05-13 01:00:08,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +31: [2023-05-13 01:00:08,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +23: [2023-05-13 01:00:08,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +20: [2023-05-13 01:00:08,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +20: [2023-05-13 01:00:08,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +31: [2023-05-13 01:00:08,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +31: [2023-05-13 01:00:08,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +21: [2023-05-13 01:00:08,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +30: [2023-05-13 01:00:08,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 9: [2023-05-13 01:00:08,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:08,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +30: [2023-05-13 01:00:08,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +16: [2023-05-13 01:00:08,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 1: [2023-05-13 01:00:08,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +16: [2023-05-13 01:00:08,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +16: [2023-05-13 01:00:08,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +16: [2023-05-13 01:00:08,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +16: [2023-05-13 01:00:08,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +16: [2023-05-13 01:00:08,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +16: [2023-05-13 01:00:08,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +16: [2023-05-13 01:00:08,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +24: [2023-05-13 01:00:08,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +24: [2023-05-13 01:00:08,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +30: [2023-05-13 01:00:08,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +10: [2023-05-13 01:00:08,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:08,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:08,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +16: [2023-05-13 01:00:08,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 1: [2023-05-13 01:00:08,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +30: [2023-05-13 01:00:08,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +30: [2023-05-13 01:00:08,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +10: [2023-05-13 01:00:08,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:08,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:08,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:08,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:08,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +16: [2023-05-13 01:00:08,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +16: [2023-05-13 01:00:08,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +16: [2023-05-13 01:00:08,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +23: [2023-05-13 01:00:08,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +16: [2023-05-13 01:00:08,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +16: [2023-05-13 01:00:08,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +24: [2023-05-13 01:00:08,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +24: [2023-05-13 01:00:08,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +10: [2023-05-13 01:00:08,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:08,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +27: [2023-05-13 01:00:08,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +27: [2023-05-13 01:00:08,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +27: [2023-05-13 01:00:08,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +27: [2023-05-13 01:00:08,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +27: [2023-05-13 01:00:08,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +27: [2023-05-13 01:00:08,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +27: [2023-05-13 01:00:08,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +27: [2023-05-13 01:00:08,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +27: [2023-05-13 01:00:08,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +27: [2023-05-13 01:00:08,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +27: [2023-05-13 01:00:08,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +27: [2023-05-13 01:00:08,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +27: [2023-05-13 01:00:08,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +27: [2023-05-13 01:00:08,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +27: [2023-05-13 01:00:08,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +27: [2023-05-13 01:00:08,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +16: [2023-05-13 01:00:08,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:08,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +16: [2023-05-13 01:00:08,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +16: [2023-05-13 01:00:08,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +16: [2023-05-13 01:00:08,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +16: [2023-05-13 01:00:08,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +16: [2023-05-13 01:00:08,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +16: [2023-05-13 01:00:08,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:08,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:08,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:08,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:08,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:08,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:08,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:08,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:08,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:08,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +11: [2023-05-13 01:00:08,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +11: [2023-05-13 01:00:08,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +11: [2023-05-13 01:00:08,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +11: [2023-05-13 01:00:08,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +11: [2023-05-13 01:00:08,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +16: [2023-05-13 01:00:08,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +11: [2023-05-13 01:00:08,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +11: [2023-05-13 01:00:08,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +27: [2023-05-13 01:00:08,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +27: [2023-05-13 01:00:08,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +27: [2023-05-13 01:00:08,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +27: [2023-05-13 01:00:08,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +27: [2023-05-13 01:00:08,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +27: [2023-05-13 01:00:08,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:08,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +27: [2023-05-13 01:00:08,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +27: [2023-05-13 01:00:08,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +16: [2023-05-13 01:00:08,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:08,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:08,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:08,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:08,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +11: [2023-05-13 01:00:08,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +27: [2023-05-13 01:00:08,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +22: [2023-05-13 01:00:08,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +22: [2023-05-13 01:00:08,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 5: [2023-05-13 01:00:08,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +27: [2023-05-13 01:00:08,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 5: [2023-05-13 01:00:08,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +27: [2023-05-13 01:00:08,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +22: [2023-05-13 01:00:08,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +22: [2023-05-13 01:00:08,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +22: [2023-05-13 01:00:08,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +22: [2023-05-13 01:00:08,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +22: [2023-05-13 01:00:08,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +22: [2023-05-13 01:00:08,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +27: [2023-05-13 01:00:08,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:08,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 7: [2023-05-13 01:00:08,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:08,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:08,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +27: [2023-05-13 01:00:08,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +22: [2023-05-13 01:00:08,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +22: [2023-05-13 01:00:08,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +22: [2023-05-13 01:00:08,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:08,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +22: [2023-05-13 01:00:08,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +22: [2023-05-13 01:00:08,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +27: [2023-05-13 01:00:08,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +14: [2023-05-13 01:00:09,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +14: [2023-05-13 01:00:09,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +27: [2023-05-13 01:00:09,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +11: [2023-05-13 01:00:09,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +14: [2023-05-13 01:00:09,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +14: [2023-05-13 01:00:09,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +14: [2023-05-13 01:00:09,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +14: [2023-05-13 01:00:09,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +14: [2023-05-13 01:00:09,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +14: [2023-05-13 01:00:09,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:09,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +14: [2023-05-13 01:00:09,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +11: [2023-05-13 01:00:09,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:09,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +14: [2023-05-13 01:00:09,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:09,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:09,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:09,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:09,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:09,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:09,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:09,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +11: [2023-05-13 01:00:09,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +27: [2023-05-13 01:00:09,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +26: [2023-05-13 01:00:09,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:09,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:09,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:09,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:09,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:09,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:09,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:09,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:09,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:09,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +26: [2023-05-13 01:00:09,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:09,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +26: [2023-05-13 01:00:09,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +26: [2023-05-13 01:00:09,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +26: [2023-05-13 01:00:09,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +26: [2023-05-13 01:00:09,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +11: [2023-05-13 01:00:09,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:09,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +11: [2023-05-13 01:00:09,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +11: [2023-05-13 01:00:09,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +11: [2023-05-13 01:00:09,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +29: [2023-05-13 01:00:09,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +29: [2023-05-13 01:00:09,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +29: [2023-05-13 01:00:09,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +29: [2023-05-13 01:00:09,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +29: [2023-05-13 01:00:09,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +29: [2023-05-13 01:00:09,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +29: [2023-05-13 01:00:09,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +29: [2023-05-13 01:00:09,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:09,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +29: [2023-05-13 01:00:09,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +29: [2023-05-13 01:00:09,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +29: [2023-05-13 01:00:09,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +29: [2023-05-13 01:00:09,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +29: [2023-05-13 01:00:09,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +29: [2023-05-13 01:00:09,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +29: [2023-05-13 01:00:09,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +29: [2023-05-13 01:00:09,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:09,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +22: [2023-05-13 01:00:09,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +22: [2023-05-13 01:00:09,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +21: [2023-05-13 01:00:09,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +21: [2023-05-13 01:00:09,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +21: [2023-05-13 01:00:09,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +22: [2023-05-13 01:00:09,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +21: [2023-05-13 01:00:09,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +21: [2023-05-13 01:00:09,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +21: [2023-05-13 01:00:09,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +21: [2023-05-13 01:00:09,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +21: [2023-05-13 01:00:09,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +21: [2023-05-13 01:00:09,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +14: [2023-05-13 01:00:09,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +21: [2023-05-13 01:00:09,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +21: [2023-05-13 01:00:09,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +22: [2023-05-13 01:00:09,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +22: [2023-05-13 01:00:09,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:09,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +14: [2023-05-13 01:00:09,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:09,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +21: [2023-05-13 01:00:09,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +21: [2023-05-13 01:00:09,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +21: [2023-05-13 01:00:09,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +21: [2023-05-13 01:00:09,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +26: [2023-05-13 01:00:09,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +21: [2023-05-13 01:00:09,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +14: [2023-05-13 01:00:09,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +28: [2023-05-13 01:00:09,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +28: [2023-05-13 01:00:09,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +28: [2023-05-13 01:00:09,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +28: [2023-05-13 01:00:09,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +14: [2023-05-13 01:00:09,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +28: [2023-05-13 01:00:09,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +28: [2023-05-13 01:00:09,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +28: [2023-05-13 01:00:09,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +28: [2023-05-13 01:00:09,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +22: [2023-05-13 01:00:09,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +22: [2023-05-13 01:00:09,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +28: [2023-05-13 01:00:09,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +22: [2023-05-13 01:00:09,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +14: [2023-05-13 01:00:09,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +14: [2023-05-13 01:00:09,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +14: [2023-05-13 01:00:09,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +28: [2023-05-13 01:00:09,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +28: [2023-05-13 01:00:09,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +28: [2023-05-13 01:00:09,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +28: [2023-05-13 01:00:09,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +28: [2023-05-13 01:00:09,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +28: [2023-05-13 01:00:09,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +26: [2023-05-13 01:00:09,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +22: [2023-05-13 01:00:09,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +22: [2023-05-13 01:00:09,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +28: [2023-05-13 01:00:09,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +22: [2023-05-13 01:00:09,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +14: [2023-05-13 01:00:09,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +17: [2023-05-13 01:00:09,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +17: [2023-05-13 01:00:09,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +17: [2023-05-13 01:00:09,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +17: [2023-05-13 01:00:09,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +17: [2023-05-13 01:00:09,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +17: [2023-05-13 01:00:09,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +17: [2023-05-13 01:00:09,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +17: [2023-05-13 01:00:09,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +22: [2023-05-13 01:00:09,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +14: [2023-05-13 01:00:09,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +14: [2023-05-13 01:00:09,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +17: [2023-05-13 01:00:09,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +17: [2023-05-13 01:00:09,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +26: [2023-05-13 01:00:09,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +17: [2023-05-13 01:00:09,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +29: [2023-05-13 01:00:09,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +17: [2023-05-13 01:00:09,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +17: [2023-05-13 01:00:09,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +17: [2023-05-13 01:00:09,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +17: [2023-05-13 01:00:09,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +17: [2023-05-13 01:00:09,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:09,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:09,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +21: [2023-05-13 01:00:09,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +14: [2023-05-13 01:00:09,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +14: [2023-05-13 01:00:09,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +14: [2023-05-13 01:00:09,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +29: [2023-05-13 01:00:09,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +22: [2023-05-13 01:00:09,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +14: [2023-05-13 01:00:09,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +26: [2023-05-13 01:00:09,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +29: [2023-05-13 01:00:09,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +29: [2023-05-13 01:00:09,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +29: [2023-05-13 01:00:09,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +21: [2023-05-13 01:00:09,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +29: [2023-05-13 01:00:09,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +14: [2023-05-13 01:00:09,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +14: [2023-05-13 01:00:09,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +29: [2023-05-13 01:00:09,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +26: [2023-05-13 01:00:09,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:09,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:09,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:09,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +29: [2023-05-13 01:00:09,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +29: [2023-05-13 01:00:09,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:09,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +21: [2023-05-13 01:00:09,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +21: [2023-05-13 01:00:09,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +21: [2023-05-13 01:00:09,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +21: [2023-05-13 01:00:09,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +26: [2023-05-13 01:00:09,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +28: [2023-05-13 01:00:09,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +29: [2023-05-13 01:00:09,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +21: [2023-05-13 01:00:09,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +29: [2023-05-13 01:00:09,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +21: [2023-05-13 01:00:09,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +29: [2023-05-13 01:00:09,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +19: [2023-05-13 01:00:09,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +19: [2023-05-13 01:00:09,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +19: [2023-05-13 01:00:09,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +19: [2023-05-13 01:00:09,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +19: [2023-05-13 01:00:09,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +21: [2023-05-13 01:00:09,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +19: [2023-05-13 01:00:09,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +17: [2023-05-13 01:00:09,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +28: [2023-05-13 01:00:09,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +21: [2023-05-13 01:00:09,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +29: [2023-05-13 01:00:09,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +19: [2023-05-13 01:00:09,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +17: [2023-05-13 01:00:09,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +19: [2023-05-13 01:00:09,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +19: [2023-05-13 01:00:09,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +28: [2023-05-13 01:00:09,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +28: [2023-05-13 01:00:09,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +28: [2023-05-13 01:00:09,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +29: [2023-05-13 01:00:09,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +28: [2023-05-13 01:00:09,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +28: [2023-05-13 01:00:09,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +28: [2023-05-13 01:00:09,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +21: [2023-05-13 01:00:09,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +19: [2023-05-13 01:00:09,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +19: [2023-05-13 01:00:09,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +29: [2023-05-13 01:00:09,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +19: [2023-05-13 01:00:09,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +29: [2023-05-13 01:00:09,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +21: [2023-05-13 01:00:09,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +26: [2023-05-13 01:00:09,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +26: [2023-05-13 01:00:09,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +26: [2023-05-13 01:00:09,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +26: [2023-05-13 01:00:09,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +21: [2023-05-13 01:00:09,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +17: [2023-05-13 01:00:09,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +15: [2023-05-13 01:00:09,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +15: [2023-05-13 01:00:09,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +15: [2023-05-13 01:00:09,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +15: [2023-05-13 01:00:09,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +15: [2023-05-13 01:00:09,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +15: [2023-05-13 01:00:09,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +15: [2023-05-13 01:00:09,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +15: [2023-05-13 01:00:09,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +28: [2023-05-13 01:00:09,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +15: [2023-05-13 01:00:09,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +15: [2023-05-13 01:00:09,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:09,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +21: [2023-05-13 01:00:09,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +21: [2023-05-13 01:00:09,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +15: [2023-05-13 01:00:09,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +17: [2023-05-13 01:00:09,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +15: [2023-05-13 01:00:09,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +15: [2023-05-13 01:00:09,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +17: [2023-05-13 01:00:09,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +10: [2023-05-13 01:00:09,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +10: [2023-05-13 01:00:09,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +10: [2023-05-13 01:00:09,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +10: [2023-05-13 01:00:09,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +10: [2023-05-13 01:00:09,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +28: [2023-05-13 01:00:09,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:09,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +10: [2023-05-13 01:00:09,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +28: [2023-05-13 01:00:09,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:09,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +17: [2023-05-13 01:00:09,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +17: [2023-05-13 01:00:09,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +17: [2023-05-13 01:00:09,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +17: [2023-05-13 01:00:09,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +17: [2023-05-13 01:00:09,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +10: [2023-05-13 01:00:09,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:09,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:09,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:09,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +28: [2023-05-13 01:00:09,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:09,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +28: [2023-05-13 01:00:09,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:09,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +28: [2023-05-13 01:00:09,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:09,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:09,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +28: [2023-05-13 01:00:09,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +28: [2023-05-13 01:00:09,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +19: [2023-05-13 01:00:09,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +17: [2023-05-13 01:00:09,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +23: [2023-05-13 01:00:09,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +23: [2023-05-13 01:00:09,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +23: [2023-05-13 01:00:09,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +23: [2023-05-13 01:00:09,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +23: [2023-05-13 01:00:09,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +23: [2023-05-13 01:00:09,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +23: [2023-05-13 01:00:09,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +23: [2023-05-13 01:00:09,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +23: [2023-05-13 01:00:09,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +23: [2023-05-13 01:00:09,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +23: [2023-05-13 01:00:09,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +23: [2023-05-13 01:00:09,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +23: [2023-05-13 01:00:09,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +23: [2023-05-13 01:00:09,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +23: [2023-05-13 01:00:09,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +23: [2023-05-13 01:00:09,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:09,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +31: [2023-05-13 01:00:09,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +31: [2023-05-13 01:00:09,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +31: [2023-05-13 01:00:09,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +31: [2023-05-13 01:00:09,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +31: [2023-05-13 01:00:09,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +31: [2023-05-13 01:00:09,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +31: [2023-05-13 01:00:09,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +17: [2023-05-13 01:00:09,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +31: [2023-05-13 01:00:09,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +15: [2023-05-13 01:00:09,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +17: [2023-05-13 01:00:09,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +31: [2023-05-13 01:00:09,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +17: [2023-05-13 01:00:09,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +17: [2023-05-13 01:00:09,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +31: [2023-05-13 01:00:09,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +31: [2023-05-13 01:00:09,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +31: [2023-05-13 01:00:09,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +17: [2023-05-13 01:00:09,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +31: [2023-05-13 01:00:09,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +31: [2023-05-13 01:00:09,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +31: [2023-05-13 01:00:09,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +19: [2023-05-13 01:00:09,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +19: [2023-05-13 01:00:09,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +20: [2023-05-13 01:00:09,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +20: [2023-05-13 01:00:09,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +20: [2023-05-13 01:00:09,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +20: [2023-05-13 01:00:09,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +20: [2023-05-13 01:00:09,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +20: [2023-05-13 01:00:09,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +20: [2023-05-13 01:00:09,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +20: [2023-05-13 01:00:09,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +15: [2023-05-13 01:00:09,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +20: [2023-05-13 01:00:09,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +10: [2023-05-13 01:00:09,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +19: [2023-05-13 01:00:09,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +19: [2023-05-13 01:00:09,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +20: [2023-05-13 01:00:09,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +19: [2023-05-13 01:00:09,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +10: [2023-05-13 01:00:09,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +20: [2023-05-13 01:00:09,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +20: [2023-05-13 01:00:09,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +20: [2023-05-13 01:00:09,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +20: [2023-05-13 01:00:09,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +20: [2023-05-13 01:00:09,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +20: [2023-05-13 01:00:09,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +19: [2023-05-13 01:00:09,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +15: [2023-05-13 01:00:09,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +15: [2023-05-13 01:00:09,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +15: [2023-05-13 01:00:09,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +15: [2023-05-13 01:00:09,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +10: [2023-05-13 01:00:09,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +16: [2023-05-13 01:00:09,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +16: [2023-05-13 01:00:09,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +16: [2023-05-13 01:00:09,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +16: [2023-05-13 01:00:09,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +16: [2023-05-13 01:00:09,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +19: [2023-05-13 01:00:09,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +15: [2023-05-13 01:00:09,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +15: [2023-05-13 01:00:09,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +15: [2023-05-13 01:00:09,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +10: [2023-05-13 01:00:09,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +10: [2023-05-13 01:00:09,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +10: [2023-05-13 01:00:09,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +10: [2023-05-13 01:00:09,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +10: [2023-05-13 01:00:09,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +23: [2023-05-13 01:00:09,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +15: [2023-05-13 01:00:09,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +25: [2023-05-13 01:00:09,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +25: [2023-05-13 01:00:09,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +25: [2023-05-13 01:00:09,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +25: [2023-05-13 01:00:09,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +25: [2023-05-13 01:00:09,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +25: [2023-05-13 01:00:09,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +25: [2023-05-13 01:00:09,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +25: [2023-05-13 01:00:09,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +10: [2023-05-13 01:00:09,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +25: [2023-05-13 01:00:09,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +25: [2023-05-13 01:00:09,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +31: [2023-05-13 01:00:09,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +25: [2023-05-13 01:00:09,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +27: [2023-05-13 01:00:09,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +27: [2023-05-13 01:00:09,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +27: [2023-05-13 01:00:09,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +27: [2023-05-13 01:00:09,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +27: [2023-05-13 01:00:09,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +25: [2023-05-13 01:00:09,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +25: [2023-05-13 01:00:09,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +25: [2023-05-13 01:00:09,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +10: [2023-05-13 01:00:09,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +23: [2023-05-13 01:00:09,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +25: [2023-05-13 01:00:09,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +19: [2023-05-13 01:00:09,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +25: [2023-05-13 01:00:09,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +19: [2023-05-13 01:00:09,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +19: [2023-05-13 01:00:09,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +19: [2023-05-13 01:00:09,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +23: [2023-05-13 01:00:09,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +15: [2023-05-13 01:00:09,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +19: [2023-05-13 01:00:09,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +15: [2023-05-13 01:00:09,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +19: [2023-05-13 01:00:09,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +15: [2023-05-13 01:00:09,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +31: [2023-05-13 01:00:09,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +23: [2023-05-13 01:00:09,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +20: [2023-05-13 01:00:09,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +15: [2023-05-13 01:00:09,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +31: [2023-05-13 01:00:09,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +31: [2023-05-13 01:00:09,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +31: [2023-05-13 01:00:09,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +10: [2023-05-13 01:00:09,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +10: [2023-05-13 01:00:09,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +10: [2023-05-13 01:00:09,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:09,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +10: [2023-05-13 01:00:09,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +10: [2023-05-13 01:00:09,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +31: [2023-05-13 01:00:09,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +31: [2023-05-13 01:00:09,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +31: [2023-05-13 01:00:09,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +31: [2023-05-13 01:00:09,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +23: [2023-05-13 01:00:09,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +23: [2023-05-13 01:00:09,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +23: [2023-05-13 01:00:09,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +23: [2023-05-13 01:00:09,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +23: [2023-05-13 01:00:09,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +23: [2023-05-13 01:00:09,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +23: [2023-05-13 01:00:09,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +19: [2023-05-13 01:00:09,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:09,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +16: [2023-05-13 01:00:09,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +16: [2023-05-13 01:00:09,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +16: [2023-05-13 01:00:09,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:09,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:09,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:09,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:09,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:09,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:09,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:09,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:09,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +20: [2023-05-13 01:00:09,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +31: [2023-05-13 01:00:09,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +31: [2023-05-13 01:00:09,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +31: [2023-05-13 01:00:09,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +31: [2023-05-13 01:00:09,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +25: [2023-05-13 01:00:09,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +25: [2023-05-13 01:00:09,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +31: [2023-05-13 01:00:09,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +31: [2023-05-13 01:00:09,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +31: [2023-05-13 01:00:09,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +20: [2023-05-13 01:00:09,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +20: [2023-05-13 01:00:09,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +20: [2023-05-13 01:00:09,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +27: [2023-05-13 01:00:09,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +27: [2023-05-13 01:00:09,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +27: [2023-05-13 01:00:09,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +27: [2023-05-13 01:00:09,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +27: [2023-05-13 01:00:09,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +27: [2023-05-13 01:00:09,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +27: [2023-05-13 01:00:09,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +27: [2023-05-13 01:00:09,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +27: [2023-05-13 01:00:09,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +27: [2023-05-13 01:00:09,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +27: [2023-05-13 01:00:09,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +24: [2023-05-13 01:00:09,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +24: [2023-05-13 01:00:09,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +20: [2023-05-13 01:00:09,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +20: [2023-05-13 01:00:09,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +20: [2023-05-13 01:00:09,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:09,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +11: [2023-05-13 01:00:09,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +11: [2023-05-13 01:00:09,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +11: [2023-05-13 01:00:09,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +11: [2023-05-13 01:00:09,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +11: [2023-05-13 01:00:09,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +11: [2023-05-13 01:00:09,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +11: [2023-05-13 01:00:09,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +23: [2023-05-13 01:00:09,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +23: [2023-05-13 01:00:09,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +24: [2023-05-13 01:00:09,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:09,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +23: [2023-05-13 01:00:09,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +23: [2023-05-13 01:00:09,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +11: [2023-05-13 01:00:09,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +23: [2023-05-13 01:00:09,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +25: [2023-05-13 01:00:09,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:09,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +11: [2023-05-13 01:00:09,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +11: [2023-05-13 01:00:09,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +24: [2023-05-13 01:00:09,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +11: [2023-05-13 01:00:09,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +11: [2023-05-13 01:00:09,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +25: [2023-05-13 01:00:09,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +11: [2023-05-13 01:00:09,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +24: [2023-05-13 01:00:09,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +24: [2023-05-13 01:00:09,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +24: [2023-05-13 01:00:09,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +24: [2023-05-13 01:00:09,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +24: [2023-05-13 01:00:09,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +24: [2023-05-13 01:00:09,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +25: [2023-05-13 01:00:09,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +24: [2023-05-13 01:00:09,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:09,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +18: [2023-05-13 01:00:09,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +18: [2023-05-13 01:00:09,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:09,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +18: [2023-05-13 01:00:09,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +18: [2023-05-13 01:00:09,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +18: [2023-05-13 01:00:09,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:09,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +24: [2023-05-13 01:00:09,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +24: [2023-05-13 01:00:09,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +24: [2023-05-13 01:00:09,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +24: [2023-05-13 01:00:09,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:09,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +24: [2023-05-13 01:00:09,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:09,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:09,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +30: [2023-05-13 01:00:09,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +18: [2023-05-13 01:00:09,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:09,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +30: [2023-05-13 01:00:09,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +30: [2023-05-13 01:00:09,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +30: [2023-05-13 01:00:09,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +30: [2023-05-13 01:00:09,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +30: [2023-05-13 01:00:09,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +30: [2023-05-13 01:00:09,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +30: [2023-05-13 01:00:09,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +14: [2023-05-13 01:00:09,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +14: [2023-05-13 01:00:09,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +24: [2023-05-13 01:00:09,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +30: [2023-05-13 01:00:09,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +25: [2023-05-13 01:00:09,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +25: [2023-05-13 01:00:09,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +25: [2023-05-13 01:00:09,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +25: [2023-05-13 01:00:09,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +25: [2023-05-13 01:00:09,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +30: [2023-05-13 01:00:09,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +18: [2023-05-13 01:00:09,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:09,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +14: [2023-05-13 01:00:09,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +18: [2023-05-13 01:00:09,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:09,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +14: [2023-05-13 01:00:09,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +18: [2023-05-13 01:00:09,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:09,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +12: [2023-05-13 01:00:09,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +14: [2023-05-13 01:00:09,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +12: [2023-05-13 01:00:09,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +12: [2023-05-13 01:00:09,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +12: [2023-05-13 01:00:09,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +12: [2023-05-13 01:00:09,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +12: [2023-05-13 01:00:09,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +12: [2023-05-13 01:00:09,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +12: [2023-05-13 01:00:09,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +14: [2023-05-13 01:00:09,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +14: [2023-05-13 01:00:09,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +30: [2023-05-13 01:00:09,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:09,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +30: [2023-05-13 01:00:09,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +22: [2023-05-13 01:00:09,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +12: [2023-05-13 01:00:09,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +25: [2023-05-13 01:00:09,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +14: [2023-05-13 01:00:09,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +22: [2023-05-13 01:00:09,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +22: [2023-05-13 01:00:09,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:09,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +14: [2023-05-13 01:00:09,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +30: [2023-05-13 01:00:09,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:09,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +14: [2023-05-13 01:00:09,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +22: [2023-05-13 01:00:09,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +30: [2023-05-13 01:00:09,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +30: [2023-05-13 01:00:09,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +22: [2023-05-13 01:00:09,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +12: [2023-05-13 01:00:09,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +12: [2023-05-13 01:00:09,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +22: [2023-05-13 01:00:09,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +22: [2023-05-13 01:00:09,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +12: [2023-05-13 01:00:09,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +12: [2023-05-13 01:00:09,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +22: [2023-05-13 01:00:09,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +12: [2023-05-13 01:00:09,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +12: [2023-05-13 01:00:09,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +12: [2023-05-13 01:00:09,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +22: [2023-05-13 01:00:09,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +22: [2023-05-13 01:00:09,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +16: [2023-05-13 01:00:09,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +16: [2023-05-13 01:00:09,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +16: [2023-05-13 01:00:09,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +16: [2023-05-13 01:00:09,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +16: [2023-05-13 01:00:09,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +16: [2023-05-13 01:00:09,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +16: [2023-05-13 01:00:09,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +16: [2023-05-13 01:00:09,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +24: [2023-05-13 01:00:09,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +29: [2023-05-13 01:00:09,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +29: [2023-05-13 01:00:09,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +29: [2023-05-13 01:00:09,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +29: [2023-05-13 01:00:09,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +29: [2023-05-13 01:00:09,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +29: [2023-05-13 01:00:09,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +29: [2023-05-13 01:00:09,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +29: [2023-05-13 01:00:09,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +29: [2023-05-13 01:00:09,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:09,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +16: [2023-05-13 01:00:09,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +25: [2023-05-13 01:00:09,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +29: [2023-05-13 01:00:09,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +29: [2023-05-13 01:00:09,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +29: [2023-05-13 01:00:09,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +29: [2023-05-13 01:00:09,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +29: [2023-05-13 01:00:09,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +29: [2023-05-13 01:00:09,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +20: [2023-05-13 01:00:09,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +20: [2023-05-13 01:00:09,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +20: [2023-05-13 01:00:09,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +20: [2023-05-13 01:00:09,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +20: [2023-05-13 01:00:09,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +20: [2023-05-13 01:00:09,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +20: [2023-05-13 01:00:09,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +20: [2023-05-13 01:00:09,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +29: [2023-05-13 01:00:09,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +27: [2023-05-13 01:00:09,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +27: [2023-05-13 01:00:09,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +27: [2023-05-13 01:00:09,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +27: [2023-05-13 01:00:09,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +27: [2023-05-13 01:00:09,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +27: [2023-05-13 01:00:09,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +27: [2023-05-13 01:00:09,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +27: [2023-05-13 01:00:09,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +27: [2023-05-13 01:00:09,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +27: [2023-05-13 01:00:09,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +27: [2023-05-13 01:00:09,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +27: [2023-05-13 01:00:09,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +27: [2023-05-13 01:00:09,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +27: [2023-05-13 01:00:09,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +27: [2023-05-13 01:00:09,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +27: [2023-05-13 01:00:09,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +16: [2023-05-13 01:00:09,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +16: [2023-05-13 01:00:09,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +25: [2023-05-13 01:00:09,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +25: [2023-05-13 01:00:09,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:09,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +25: [2023-05-13 01:00:09,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +26: [2023-05-13 01:00:09,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +26: [2023-05-13 01:00:09,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +26: [2023-05-13 01:00:09,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +26: [2023-05-13 01:00:09,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +26: [2023-05-13 01:00:09,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +26: [2023-05-13 01:00:09,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +26: [2023-05-13 01:00:09,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +26: [2023-05-13 01:00:09,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +25: [2023-05-13 01:00:09,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +16: [2023-05-13 01:00:09,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +11: [2023-05-13 01:00:09,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +16: [2023-05-13 01:00:09,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +26: [2023-05-13 01:00:09,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +26: [2023-05-13 01:00:09,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +11: [2023-05-13 01:00:09,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +11: [2023-05-13 01:00:09,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +26: [2023-05-13 01:00:09,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +26: [2023-05-13 01:00:09,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +26: [2023-05-13 01:00:09,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +24: [2023-05-13 01:00:09,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +26: [2023-05-13 01:00:09,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +26: [2023-05-13 01:00:09,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +13: [2023-05-13 01:00:09,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +13: [2023-05-13 01:00:09,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +13: [2023-05-13 01:00:09,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:09,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +13: [2023-05-13 01:00:09,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +13: [2023-05-13 01:00:09,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +13: [2023-05-13 01:00:09,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +13: [2023-05-13 01:00:09,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +13: [2023-05-13 01:00:09,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +13: [2023-05-13 01:00:09,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +13: [2023-05-13 01:00:09,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +13: [2023-05-13 01:00:09,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +13: [2023-05-13 01:00:09,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +13: [2023-05-13 01:00:09,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +22: [2023-05-13 01:00:09,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +13: [2023-05-13 01:00:09,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +13: [2023-05-13 01:00:09,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +13: [2023-05-13 01:00:09,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +24: [2023-05-13 01:00:09,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +11: [2023-05-13 01:00:09,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +11: [2023-05-13 01:00:09,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +11: [2023-05-13 01:00:09,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +11: [2023-05-13 01:00:09,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +30: [2023-05-13 01:00:09,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +12: [2023-05-13 01:00:09,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +18: [2023-05-13 01:00:09,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +18: [2023-05-13 01:00:09,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +18: [2023-05-13 01:00:09,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +18: [2023-05-13 01:00:09,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +18: [2023-05-13 01:00:09,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +14: [2023-05-13 01:00:09,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:09,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:09,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +30: [2023-05-13 01:00:09,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +24: [2023-05-13 01:00:09,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +24: [2023-05-13 01:00:09,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +11: [2023-05-13 01:00:09,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +30: [2023-05-13 01:00:09,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +14: [2023-05-13 01:00:09,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +14: [2023-05-13 01:00:09,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +14: [2023-05-13 01:00:09,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +11: [2023-05-13 01:00:09,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +22: [2023-05-13 01:00:09,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +22: [2023-05-13 01:00:09,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +24: [2023-05-13 01:00:09,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +24: [2023-05-13 01:00:09,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:09,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +12: [2023-05-13 01:00:09,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +14: [2023-05-13 01:00:09,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +18: [2023-05-13 01:00:09,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +18: [2023-05-13 01:00:09,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +18: [2023-05-13 01:00:09,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +24: [2023-05-13 01:00:09,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +24: [2023-05-13 01:00:09,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +24: [2023-05-13 01:00:09,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +12: [2023-05-13 01:00:09,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +12: [2023-05-13 01:00:09,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +18: [2023-05-13 01:00:09,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +18: [2023-05-13 01:00:09,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +18: [2023-05-13 01:00:09,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +22: [2023-05-13 01:00:09,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +14: [2023-05-13 01:00:09,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +22: [2023-05-13 01:00:09,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +11: [2023-05-13 01:00:09,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +14: [2023-05-13 01:00:09,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +14: [2023-05-13 01:00:09,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +18: [2023-05-13 01:00:09,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +11: [2023-05-13 01:00:09,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +18: [2023-05-13 01:00:09,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +29: [2023-05-13 01:00:09,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +11: [2023-05-13 01:00:09,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +11: [2023-05-13 01:00:09,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +22: [2023-05-13 01:00:09,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +11: [2023-05-13 01:00:09,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +30: [2023-05-13 01:00:09,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +30: [2023-05-13 01:00:09,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +29: [2023-05-13 01:00:09,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +29: [2023-05-13 01:00:09,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:09,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +14: [2023-05-13 01:00:09,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +26: [2023-05-13 01:00:09,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +22: [2023-05-13 01:00:09,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... +14: [2023-05-13 01:00:09,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:09,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +29: [2023-05-13 01:00:09,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +29: [2023-05-13 01:00:09,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +24: [2023-05-13 01:00:09,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +30: [2023-05-13 01:00:09,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +30: [2023-05-13 01:00:09,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +30: [2023-05-13 01:00:09,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +13: [2023-05-13 01:00:09,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +12: [2023-05-13 01:00:09,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +12: [2023-05-13 01:00:09,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +12: [2023-05-13 01:00:09,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +12: [2023-05-13 01:00:09,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +12: [2023-05-13 01:00:09,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +26: [2023-05-13 01:00:09,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +29: [2023-05-13 01:00:09,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +14: [2023-05-13 01:00:09,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +29: [2023-05-13 01:00:09,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +24: [2023-05-13 01:00:09,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +13: [2023-05-13 01:00:09,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +13: [2023-05-13 01:00:09,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +13: [2023-05-13 01:00:09,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +14: [2023-05-13 01:00:09,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +12: [2023-05-13 01:00:09,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +18: [2023-05-13 01:00:09,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +12: [2023-05-13 01:00:09,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +18: [2023-05-13 01:00:09,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +22: [2023-05-13 01:00:09,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +22: [2023-05-13 01:00:09,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +22: [2023-05-13 01:00:09,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +28: [2023-05-13 01:00:09,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +28: [2023-05-13 01:00:09,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +28: [2023-05-13 01:00:09,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +28: [2023-05-13 01:00:09,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +28: [2023-05-13 01:00:09,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +24: [2023-05-13 01:00:09,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +14: [2023-05-13 01:00:09,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +18: [2023-05-13 01:00:09,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +26: [2023-05-13 01:00:09,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:09,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +14: [2023-05-13 01:00:09,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +22: [2023-05-13 01:00:09,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +13: [2023-05-13 01:00:09,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +22: [2023-05-13 01:00:09,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +24: [2023-05-13 01:00:09,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +24: [2023-05-13 01:00:09,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +26: [2023-05-13 01:00:09,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +26: [2023-05-13 01:00:09,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +29: [2023-05-13 01:00:09,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +26: [2023-05-13 01:00:09,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +30: [2023-05-13 01:00:09,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +29: [2023-05-13 01:00:09,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +26: [2023-05-13 01:00:09,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +13: [2023-05-13 01:00:09,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +13: [2023-05-13 01:00:09,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +13: [2023-05-13 01:00:09,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +13: [2023-05-13 01:00:09,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +30: [2023-05-13 01:00:09,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +19: [2023-05-13 01:00:09,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +19: [2023-05-13 01:00:09,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +19: [2023-05-13 01:00:09,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +29: [2023-05-13 01:00:09,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +29: [2023-05-13 01:00:09,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +19: [2023-05-13 01:00:09,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +19: [2023-05-13 01:00:09,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +19: [2023-05-13 01:00:09,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +26: [2023-05-13 01:00:09,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +15: [2023-05-13 01:00:09,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +15: [2023-05-13 01:00:09,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +15: [2023-05-13 01:00:09,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +19: [2023-05-13 01:00:09,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +13: [2023-05-13 01:00:09,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +15: [2023-05-13 01:00:09,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +15: [2023-05-13 01:00:09,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +15: [2023-05-13 01:00:09,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +15: [2023-05-13 01:00:09,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +15: [2023-05-13 01:00:09,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +12: [2023-05-13 01:00:09,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +13: [2023-05-13 01:00:09,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +13: [2023-05-13 01:00:09,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +29: [2023-05-13 01:00:09,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +29: [2023-05-13 01:00:09,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +15: [2023-05-13 01:00:09,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +15: [2023-05-13 01:00:09,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +29: [2023-05-13 01:00:09,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +12: [2023-05-13 01:00:09,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +15: [2023-05-13 01:00:09,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +15: [2023-05-13 01:00:09,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +12: [2023-05-13 01:00:09,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +15: [2023-05-13 01:00:09,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +19: [2023-05-13 01:00:09,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +12: [2023-05-13 01:00:09,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +23: [2023-05-13 01:00:09,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +23: [2023-05-13 01:00:09,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +12: [2023-05-13 01:00:09,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +19: [2023-05-13 01:00:09,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +19: [2023-05-13 01:00:09,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +19: [2023-05-13 01:00:09,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +19: [2023-05-13 01:00:09,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +23: [2023-05-13 01:00:09,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +19: [2023-05-13 01:00:09,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +19: [2023-05-13 01:00:09,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +26: [2023-05-13 01:00:09,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +23: [2023-05-13 01:00:09,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +23: [2023-05-13 01:00:09,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +23: [2023-05-13 01:00:09,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +23: [2023-05-13 01:00:09,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +23: [2023-05-13 01:00:09,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +23: [2023-05-13 01:00:09,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +23: [2023-05-13 01:00:09,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +13: [2023-05-13 01:00:09,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +26: [2023-05-13 01:00:09,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +26: [2023-05-13 01:00:09,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +23: [2023-05-13 01:00:09,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +23: [2023-05-13 01:00:09,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +23: [2023-05-13 01:00:09,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +13: [2023-05-13 01:00:09,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +23: [2023-05-13 01:00:09,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +13: [2023-05-13 01:00:09,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +23: [2023-05-13 01:00:09,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:09,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +26: [2023-05-13 01:00:09,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +13: [2023-05-13 01:00:09,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +23: [2023-05-13 01:00:09,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. +26: [2023-05-13 01:00:09,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +28: [2023-05-13 01:00:09,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +28: [2023-05-13 01:00:09,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +28: [2023-05-13 01:00:09,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +28: [2023-05-13 01:00:09,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +28: [2023-05-13 01:00:09,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +28: [2023-05-13 01:00:09,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +28: [2023-05-13 01:00:09,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +28: [2023-05-13 01:00:09,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +28: [2023-05-13 01:00:09,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +28: [2023-05-13 01:00:09,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +28: [2023-05-13 01:00:09,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +26: [2023-05-13 01:00:09,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +26: [2023-05-13 01:00:09,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_14-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +20: [2023-05-13 01:00:09,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +20: [2023-05-13 01:00:09,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +19: [2023-05-13 01:00:09,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +20: [2023-05-13 01:00:09,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +20: [2023-05-13 01:00:09,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +20: [2023-05-13 01:00:09,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +20: [2023-05-13 01:00:09,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +20: [2023-05-13 01:00:09,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +20: [2023-05-13 01:00:09,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +23: [2023-05-13 01:00:09,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +20: [2023-05-13 01:00:09,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +20: [2023-05-13 01:00:09,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +20: [2023-05-13 01:00:09,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +20: [2023-05-13 01:00:09,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +20: [2023-05-13 01:00:09,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +20: [2023-05-13 01:00:09,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +20: [2023-05-13 01:00:09,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +20: [2023-05-13 01:00:09,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +23: [2023-05-13 01:00:09,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +15: [2023-05-13 01:00:09,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +15: [2023-05-13 01:00:09,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +21: [2023-05-13 01:00:09,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +21: [2023-05-13 01:00:09,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +21: [2023-05-13 01:00:09,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +21: [2023-05-13 01:00:09,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +21: [2023-05-13 01:00:09,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +21: [2023-05-13 01:00:09,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +21: [2023-05-13 01:00:09,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +21: [2023-05-13 01:00:09,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +21: [2023-05-13 01:00:09,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +21: [2023-05-13 01:00:09,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +21: [2023-05-13 01:00:09,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +15: [2023-05-13 01:00:09,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +21: [2023-05-13 01:00:09,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +21: [2023-05-13 01:00:09,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +21: [2023-05-13 01:00:09,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +21: [2023-05-13 01:00:09,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +23: [2023-05-13 01:00:09,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +21: [2023-05-13 01:00:09,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +15: [2023-05-13 01:00:09,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +15: [2023-05-13 01:00:09,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +15: [2023-05-13 01:00:09,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +19: [2023-05-13 01:00:09,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +15: [2023-05-13 01:00:09,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +25: [2023-05-13 01:00:09,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +25: [2023-05-13 01:00:09,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +19: [2023-05-13 01:00:09,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +23: [2023-05-13 01:00:09,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +23: [2023-05-13 01:00:09,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +19: [2023-05-13 01:00:09,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +19: [2023-05-13 01:00:09,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +25: [2023-05-13 01:00:09,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +28: [2023-05-13 01:00:09,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +28: [2023-05-13 01:00:09,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +28: [2023-05-13 01:00:09,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +28: [2023-05-13 01:00:09,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +28: [2023-05-13 01:00:09,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +28: [2023-05-13 01:00:09,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +28: [2023-05-13 01:00:09,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +28: [2023-05-13 01:00:09,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +28: [2023-05-13 01:00:09,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +28: [2023-05-13 01:00:09,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +28: [2023-05-13 01:00:09,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +28: [2023-05-13 01:00:09,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +25: [2023-05-13 01:00:09,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +25: [2023-05-13 01:00:09,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +28: [2023-05-13 01:00:09,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +28: [2023-05-13 01:00:09,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +28: [2023-05-13 01:00:09,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +25: [2023-05-13 01:00:09,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +25: [2023-05-13 01:00:09,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +25: [2023-05-13 01:00:09,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +25: [2023-05-13 01:00:09,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +25: [2023-05-13 01:00:09,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +25: [2023-05-13 01:00:09,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +23: [2023-05-13 01:00:09,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +23: [2023-05-13 01:00:09,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +23: [2023-05-13 01:00:09,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +23: [2023-05-13 01:00:09,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +25: [2023-05-13 01:00:09,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +25: [2023-05-13 01:00:09,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +25: [2023-05-13 01:00:09,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +25: [2023-05-13 01:00:09,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +25: [2023-05-13 01:00:09,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +15: [2023-05-13 01:00:09,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +20: [2023-05-13 01:00:09,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +15: [2023-05-13 01:00:09,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +17: [2023-05-13 01:00:09,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +23: [2023-05-13 01:00:09,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +17: [2023-05-13 01:00:09,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +17: [2023-05-13 01:00:09,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +17: [2023-05-13 01:00:09,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +17: [2023-05-13 01:00:09,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +21: [2023-05-13 01:00:09,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +17: [2023-05-13 01:00:09,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +21: [2023-05-13 01:00:09,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +17: [2023-05-13 01:00:09,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +20: [2023-05-13 01:00:09,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +20: [2023-05-13 01:00:09,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +20: [2023-05-13 01:00:09,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +19: [2023-05-13 01:00:09,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +20: [2023-05-13 01:00:09,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +21: [2023-05-13 01:00:09,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +21: [2023-05-13 01:00:09,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +21: [2023-05-13 01:00:09,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +21: [2023-05-13 01:00:09,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +19: [2023-05-13 01:00:09,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +23: [2023-05-13 01:00:09,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +23: [2023-05-13 01:00:09,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +23: [2023-05-13 01:00:09,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +23: [2023-05-13 01:00:09,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +23: [2023-05-13 01:00:09,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +25: [2023-05-13 01:00:09,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +25: [2023-05-13 01:00:09,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +21: [2023-05-13 01:00:09,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +19: [2023-05-13 01:00:09,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +21: [2023-05-13 01:00:09,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:09,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +21: [2023-05-13 01:00:09,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +24: [2023-05-13 01:00:09,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +24: [2023-05-13 01:00:09,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +24: [2023-05-13 01:00:09,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +20: [2023-05-13 01:00:09,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +24: [2023-05-13 01:00:09,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +24: [2023-05-13 01:00:09,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +24: [2023-05-13 01:00:09,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +24: [2023-05-13 01:00:09,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +24: [2023-05-13 01:00:09,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +21: [2023-05-13 01:00:09,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +21: [2023-05-13 01:00:09,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +24: [2023-05-13 01:00:09,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +24: [2023-05-13 01:00:09,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +21: [2023-05-13 01:00:09,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +24: [2023-05-13 01:00:09,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +20: [2023-05-13 01:00:09,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +24: [2023-05-13 01:00:09,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +21: [2023-05-13 01:00:09,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +24: [2023-05-13 01:00:09,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +24: [2023-05-13 01:00:09,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +24: [2023-05-13 01:00:09,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +24: [2023-05-13 01:00:09,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +20: [2023-05-13 01:00:09,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +20: [2023-05-13 01:00:09,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +20: [2023-05-13 01:00:09,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +20: [2023-05-13 01:00:09,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +25: [2023-05-13 01:00:09,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +20: [2023-05-13 01:00:09,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +21: [2023-05-13 01:00:09,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +25: [2023-05-13 01:00:09,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +25: [2023-05-13 01:00:09,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +23: [2023-05-13 01:00:09,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +21: [2023-05-13 01:00:09,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +17: [2023-05-13 01:00:09,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +25: [2023-05-13 01:00:09,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +25: [2023-05-13 01:00:09,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +25: [2023-05-13 01:00:09,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +25: [2023-05-13 01:00:09,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +25: [2023-05-13 01:00:09,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +21: [2023-05-13 01:00:09,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +25: [2023-05-13 01:00:09,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +20: [2023-05-13 01:00:09,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +20: [2023-05-13 01:00:09,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +20: [2023-05-13 01:00:09,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +17: [2023-05-13 01:00:09,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +20: [2023-05-13 01:00:09,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +17: [2023-05-13 01:00:09,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +30: [2023-05-13 01:00:09,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +30: [2023-05-13 01:00:09,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +30: [2023-05-13 01:00:09,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +30: [2023-05-13 01:00:09,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +30: [2023-05-13 01:00:09,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +17: [2023-05-13 01:00:09,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +30: [2023-05-13 01:00:09,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +25: [2023-05-13 01:00:09,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +30: [2023-05-13 01:00:09,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +30: [2023-05-13 01:00:09,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +24: [2023-05-13 01:00:09,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +24: [2023-05-13 01:00:09,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +25: [2023-05-13 01:00:09,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +25: [2023-05-13 01:00:09,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +25: [2023-05-13 01:00:09,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +25: [2023-05-13 01:00:09,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +17: [2023-05-13 01:00:09,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +24: [2023-05-13 01:00:09,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +24: [2023-05-13 01:00:09,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +24: [2023-05-13 01:00:09,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +24: [2023-05-13 01:00:09,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +24: [2023-05-13 01:00:09,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +24: [2023-05-13 01:00:09,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +24: [2023-05-13 01:00:09,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +24: [2023-05-13 01:00:09,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +17: [2023-05-13 01:00:09,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +17: [2023-05-13 01:00:09,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +17: [2023-05-13 01:00:09,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +17: [2023-05-13 01:00:09,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +17: [2023-05-13 01:00:09,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +18: [2023-05-13 01:00:09,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +18: [2023-05-13 01:00:09,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +18: [2023-05-13 01:00:09,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +18: [2023-05-13 01:00:09,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +18: [2023-05-13 01:00:09,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +18: [2023-05-13 01:00:09,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +18: [2023-05-13 01:00:09,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +18: [2023-05-13 01:00:09,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +13: [2023-05-13 01:00:09,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +13: [2023-05-13 01:00:09,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +18: [2023-05-13 01:00:09,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:09,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +10: [2023-05-13 01:00:09,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +10: [2023-05-13 01:00:09,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +10: [2023-05-13 01:00:09,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +10: [2023-05-13 01:00:09,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +10: [2023-05-13 01:00:09,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +10: [2023-05-13 01:00:09,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +10: [2023-05-13 01:00:09,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +18: [2023-05-13 01:00:09,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +13: [2023-05-13 01:00:09,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +10: [2023-05-13 01:00:09,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +13: [2023-05-13 01:00:09,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +13: [2023-05-13 01:00:09,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +13: [2023-05-13 01:00:09,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +18: [2023-05-13 01:00:09,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +18: [2023-05-13 01:00:09,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +18: [2023-05-13 01:00:09,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:09,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +10: [2023-05-13 01:00:09,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +10: [2023-05-13 01:00:09,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +18: [2023-05-13 01:00:09,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:09,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +18: [2023-05-13 01:00:09,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:09,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +18: [2023-05-13 01:00:09,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:09,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +10: [2023-05-13 01:00:09,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +30: [2023-05-13 01:00:09,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +24: [2023-05-13 01:00:09,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +24: [2023-05-13 01:00:09,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +24: [2023-05-13 01:00:09,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +24: [2023-05-13 01:00:09,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +30: [2023-05-13 01:00:09,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +22: [2023-05-13 01:00:09,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +22: [2023-05-13 01:00:09,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +22: [2023-05-13 01:00:09,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +22: [2023-05-13 01:00:09,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +22: [2023-05-13 01:00:09,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +22: [2023-05-13 01:00:09,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +22: [2023-05-13 01:00:09,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +22: [2023-05-13 01:00:09,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +22: [2023-05-13 01:00:09,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +24: [2023-05-13 01:00:09,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +24: [2023-05-13 01:00:09,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +22: [2023-05-13 01:00:09,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +30: [2023-05-13 01:00:09,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +22: [2023-05-13 01:00:09,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +22: [2023-05-13 01:00:09,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +22: [2023-05-13 01:00:09,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +22: [2023-05-13 01:00:09,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +30: [2023-05-13 01:00:09,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +30: [2023-05-13 01:00:09,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +12: [2023-05-13 01:00:09,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +12: [2023-05-13 01:00:09,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +12: [2023-05-13 01:00:09,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +18: [2023-05-13 01:00:09,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +12: [2023-05-13 01:00:09,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +12: [2023-05-13 01:00:09,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +12: [2023-05-13 01:00:09,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +12: [2023-05-13 01:00:09,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +12: [2023-05-13 01:00:09,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +12: [2023-05-13 01:00:09,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +12: [2023-05-13 01:00:09,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +10: [2023-05-13 01:00:09,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +18: [2023-05-13 01:00:09,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +12: [2023-05-13 01:00:09,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +12: [2023-05-13 01:00:09,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +13: [2023-05-13 01:00:09,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +13: [2023-05-13 01:00:09,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +13: [2023-05-13 01:00:09,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +13: [2023-05-13 01:00:09,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +13: [2023-05-13 01:00:09,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +13: [2023-05-13 01:00:09,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +13: [2023-05-13 01:00:09,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +13: [2023-05-13 01:00:09,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +13: [2023-05-13 01:00:09,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +13: [2023-05-13 01:00:09,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +12: [2023-05-13 01:00:09,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +12: [2023-05-13 01:00:09,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +30: [2023-05-13 01:00:09,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +12: [2023-05-13 01:00:09,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +12: [2023-05-13 01:00:09,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +18: [2023-05-13 01:00:09,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +18: [2023-05-13 01:00:09,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +10: [2023-05-13 01:00:09,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +30: [2023-05-13 01:00:09,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... +10: [2023-05-13 01:00:09,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +10: [2023-05-13 01:00:09,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +10: [2023-05-13 01:00:09,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +10: [2023-05-13 01:00:09,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +18: [2023-05-13 01:00:09,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +10: [2023-05-13 01:00:09,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +10: [2023-05-13 01:00:09,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +10: [2023-05-13 01:00:09,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +22: [2023-05-13 01:00:09,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +18: [2023-05-13 01:00:09,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +18: [2023-05-13 01:00:09,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +18: [2023-05-13 01:00:09,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +22: [2023-05-13 01:00:09,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +22: [2023-05-13 01:00:09,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +18: [2023-05-13 01:00:09,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +18: [2023-05-13 01:00:09,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +18: [2023-05-13 01:00:09,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +12: [2023-05-13 01:00:09,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +10: [2023-05-13 01:00:09,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +18: [2023-05-13 01:00:09,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +10: [2023-05-13 01:00:09,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +10: [2023-05-13 01:00:09,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +10: [2023-05-13 01:00:09,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +10: [2023-05-13 01:00:09,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +10: [2023-05-13 01:00:09,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +10: [2023-05-13 01:00:09,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +18: [2023-05-13 01:00:09,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +22: [2023-05-13 01:00:09,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +22: [2023-05-13 01:00:09,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +22: [2023-05-13 01:00:09,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +22: [2023-05-13 01:00:09,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +22: [2023-05-13 01:00:09,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +22: [2023-05-13 01:00:09,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +18: [2023-05-13 01:00:09,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +13: [2023-05-13 01:00:09,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +13: [2023-05-13 01:00:09,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +13: [2023-05-13 01:00:09,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +13: [2023-05-13 01:00:09,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +13: [2023-05-13 01:00:09,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +13: [2023-05-13 01:00:09,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +13: [2023-05-13 01:00:09,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +13: [2023-05-13 01:00:09,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +13: [2023-05-13 01:00:09,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +13: [2023-05-13 01:00:09,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +13: [2023-05-13 01:00:09,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +13: [2023-05-13 01:00:09,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +13: [2023-05-13 01:00:09,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +13: [2023-05-13 01:00:09,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +13: [2023-05-13 01:00:09,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +13: [2023-05-13 01:00:09,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +18: [2023-05-13 01:00:09,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +12: [2023-05-13 01:00:09,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +12: [2023-05-13 01:00:09,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +18: [2023-05-13 01:00:09,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +12: [2023-05-13 01:00:09,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +12: [2023-05-13 01:00:09,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +22: [2023-05-13 01:00:09,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +22: [2023-05-13 01:00:09,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +12: [2023-05-13 01:00:09,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +31: [2023-05-13 01:00:09,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +31: [2023-05-13 01:00:09,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +31: [2023-05-13 01:00:09,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +31: [2023-05-13 01:00:09,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +31: [2023-05-13 01:00:09,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +31: [2023-05-13 01:00:09,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +31: [2023-05-13 01:00:09,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +31: [2023-05-13 01:00:09,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +31: [2023-05-13 01:00:09,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +12: [2023-05-13 01:00:09,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +12: [2023-05-13 01:00:09,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +12: [2023-05-13 01:00:09,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +12: [2023-05-13 01:00:09,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +31: [2023-05-13 01:00:09,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_15-model_00-model_states.pt. +31: [2023-05-13 01:00:09,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +31: [2023-05-13 01:00:09,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:09,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +31: [2023-05-13 01:00:09,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +31: [2023-05-13 01:00:09,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +31: [2023-05-13 01:00:09,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +12: [2023-05-13 01:00:09,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +12: [2023-05-13 01:00:09,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +12: [2023-05-13 01:00:09,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +12: [2023-05-13 01:00:09,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +12: [2023-05-13 01:00:09,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +12: [2023-05-13 01:00:09,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:09,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:09,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +31: [2023-05-13 01:00:09,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +31: [2023-05-13 01:00:09,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +31: [2023-05-13 01:00:09,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +31: [2023-05-13 01:00:09,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +31: [2023-05-13 01:00:09,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +31: [2023-05-13 01:00:09,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:09,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:09,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +27: [2023-05-13 01:00:09,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +27: [2023-05-13 01:00:09,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +27: [2023-05-13 01:00:09,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +27: [2023-05-13 01:00:09,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +27: [2023-05-13 01:00:09,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +27: [2023-05-13 01:00:09,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +27: [2023-05-13 01:00:09,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +27: [2023-05-13 01:00:09,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:09,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +27: [2023-05-13 01:00:09,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +27: [2023-05-13 01:00:09,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +27: [2023-05-13 01:00:09,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +27: [2023-05-13 01:00:09,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +27: [2023-05-13 01:00:09,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +31: [2023-05-13 01:00:09,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +27: [2023-05-13 01:00:09,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +27: [2023-05-13 01:00:09,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +16: [2023-05-13 01:00:09,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +31: [2023-05-13 01:00:09,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +16: [2023-05-13 01:00:09,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +16: [2023-05-13 01:00:09,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +16: [2023-05-13 01:00:09,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +16: [2023-05-13 01:00:09,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +16: [2023-05-13 01:00:09,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +16: [2023-05-13 01:00:09,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +16: [2023-05-13 01:00:09,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +31: [2023-05-13 01:00:09,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +31: [2023-05-13 01:00:09,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +31: [2023-05-13 01:00:09,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +16: [2023-05-13 01:00:09,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +31: [2023-05-13 01:00:09,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 7: [2023-05-13 01:00:09,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +16: [2023-05-13 01:00:09,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +16: [2023-05-13 01:00:09,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +16: [2023-05-13 01:00:09,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +16: [2023-05-13 01:00:09,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +16: [2023-05-13 01:00:09,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +16: [2023-05-13 01:00:09,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +16: [2023-05-13 01:00:09,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 7: [2023-05-13 01:00:09,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +11: [2023-05-13 01:00:09,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:09,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:09,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:09,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:09,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:09,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:09,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:09,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:09,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +11: [2023-05-13 01:00:09,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:09,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +11: [2023-05-13 01:00:09,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +11: [2023-05-13 01:00:09,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +11: [2023-05-13 01:00:09,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:09,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +11: [2023-05-13 01:00:09,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:09,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:09,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:09,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:09,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:09,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:09,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:09,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:09,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:09,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +29: [2023-05-13 01:00:09,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +29: [2023-05-13 01:00:09,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +29: [2023-05-13 01:00:09,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +29: [2023-05-13 01:00:09,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +29: [2023-05-13 01:00:09,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +27: [2023-05-13 01:00:09,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:09,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +29: [2023-05-13 01:00:09,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +14: [2023-05-13 01:00:09,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +14: [2023-05-13 01:00:09,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +14: [2023-05-13 01:00:09,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +14: [2023-05-13 01:00:09,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +14: [2023-05-13 01:00:09,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +14: [2023-05-13 01:00:09,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +14: [2023-05-13 01:00:09,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +14: [2023-05-13 01:00:09,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +14: [2023-05-13 01:00:09,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +26: [2023-05-13 01:00:09,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +26: [2023-05-13 01:00:09,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +26: [2023-05-13 01:00:09,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +26: [2023-05-13 01:00:09,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +26: [2023-05-13 01:00:09,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +26: [2023-05-13 01:00:09,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +26: [2023-05-13 01:00:09,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +14: [2023-05-13 01:00:09,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +14: [2023-05-13 01:00:09,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +26: [2023-05-13 01:00:09,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 6: [2023-05-13 01:00:09,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +26: [2023-05-13 01:00:09,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +14: [2023-05-13 01:00:09,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +14: [2023-05-13 01:00:09,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +14: [2023-05-13 01:00:09,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +14: [2023-05-13 01:00:09,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +14: [2023-05-13 01:00:09,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +26: [2023-05-13 01:00:09,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +26: [2023-05-13 01:00:09,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +26: [2023-05-13 01:00:09,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +26: [2023-05-13 01:00:09,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +16: [2023-05-13 01:00:09,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +26: [2023-05-13 01:00:09,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +26: [2023-05-13 01:00:09,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 6: [2023-05-13 01:00:09,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +26: [2023-05-13 01:00:09,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +21: [2023-05-13 01:00:09,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +21: [2023-05-13 01:00:09,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +21: [2023-05-13 01:00:09,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +21: [2023-05-13 01:00:09,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +27: [2023-05-13 01:00:09,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +27: [2023-05-13 01:00:09,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +27: [2023-05-13 01:00:09,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +27: [2023-05-13 01:00:09,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +21: [2023-05-13 01:00:09,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +21: [2023-05-13 01:00:09,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +21: [2023-05-13 01:00:09,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +21: [2023-05-13 01:00:09,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +21: [2023-05-13 01:00:09,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +21: [2023-05-13 01:00:09,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +21: [2023-05-13 01:00:09,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +21: [2023-05-13 01:00:09,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +21: [2023-05-13 01:00:09,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +21: [2023-05-13 01:00:09,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +21: [2023-05-13 01:00:09,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +27: [2023-05-13 01:00:09,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +27: [2023-05-13 01:00:09,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +27: [2023-05-13 01:00:09,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +27: [2023-05-13 01:00:09,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +19: [2023-05-13 01:00:09,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:09,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +21: [2023-05-13 01:00:09,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +19: [2023-05-13 01:00:09,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +19: [2023-05-13 01:00:09,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +19: [2023-05-13 01:00:09,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +19: [2023-05-13 01:00:09,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +19: [2023-05-13 01:00:09,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +19: [2023-05-13 01:00:09,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +19: [2023-05-13 01:00:09,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +19: [2023-05-13 01:00:09,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +16: [2023-05-13 01:00:09,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +19: [2023-05-13 01:00:09,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +17: [2023-05-13 01:00:09,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +17: [2023-05-13 01:00:09,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +17: [2023-05-13 01:00:09,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +17: [2023-05-13 01:00:09,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +17: [2023-05-13 01:00:09,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +17: [2023-05-13 01:00:09,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +17: [2023-05-13 01:00:09,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:09,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:09,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +17: [2023-05-13 01:00:09,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +11: [2023-05-13 01:00:09,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +11: [2023-05-13 01:00:09,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +17: [2023-05-13 01:00:09,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +17: [2023-05-13 01:00:09,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +27: [2023-05-13 01:00:09,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +27: [2023-05-13 01:00:09,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +11: [2023-05-13 01:00:09,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +27: [2023-05-13 01:00:09,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +27: [2023-05-13 01:00:09,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +17: [2023-05-13 01:00:09,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +26: [2023-05-13 01:00:09,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +29: [2023-05-13 01:00:09,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +16: [2023-05-13 01:00:09,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +16: [2023-05-13 01:00:09,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +16: [2023-05-13 01:00:09,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:09,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:09,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +16: [2023-05-13 01:00:09,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +16: [2023-05-13 01:00:09,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +16: [2023-05-13 01:00:09,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +16: [2023-05-13 01:00:09,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +27: [2023-05-13 01:00:09,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +27: [2023-05-13 01:00:09,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +14: [2023-05-13 01:00:09,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +14: [2023-05-13 01:00:09,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +14: [2023-05-13 01:00:09,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:09,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:09,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:09,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +28: [2023-05-13 01:00:09,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +28: [2023-05-13 01:00:09,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +28: [2023-05-13 01:00:09,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +28: [2023-05-13 01:00:09,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +28: [2023-05-13 01:00:09,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +28: [2023-05-13 01:00:09,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +28: [2023-05-13 01:00:09,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +28: [2023-05-13 01:00:09,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +27: [2023-05-13 01:00:09,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +21: [2023-05-13 01:00:09,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +21: [2023-05-13 01:00:09,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +28: [2023-05-13 01:00:09,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +28: [2023-05-13 01:00:09,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +28: [2023-05-13 01:00:09,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +28: [2023-05-13 01:00:09,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +26: [2023-05-13 01:00:09,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +28: [2023-05-13 01:00:09,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +28: [2023-05-13 01:00:09,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +28: [2023-05-13 01:00:09,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +28: [2023-05-13 01:00:09,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +29: [2023-05-13 01:00:09,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:09,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:09,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:09,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:09,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +11: [2023-05-13 01:00:09,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +11: [2023-05-13 01:00:09,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +26: [2023-05-13 01:00:09,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +14: [2023-05-13 01:00:09,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +14: [2023-05-13 01:00:09,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +14: [2023-05-13 01:00:09,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +14: [2023-05-13 01:00:09,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +19: [2023-05-13 01:00:09,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:09,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +30: [2023-05-13 01:00:09,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +30: [2023-05-13 01:00:09,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +30: [2023-05-13 01:00:09,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +30: [2023-05-13 01:00:09,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +30: [2023-05-13 01:00:09,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +30: [2023-05-13 01:00:09,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +30: [2023-05-13 01:00:09,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:09,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +26: [2023-05-13 01:00:09,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +30: [2023-05-13 01:00:09,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +21: [2023-05-13 01:00:09,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +21: [2023-05-13 01:00:09,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +26: [2023-05-13 01:00:09,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +21: [2023-05-13 01:00:09,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +30: [2023-05-13 01:00:09,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +14: [2023-05-13 01:00:09,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +30: [2023-05-13 01:00:09,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +30: [2023-05-13 01:00:09,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +26: [2023-05-13 01:00:09,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +14: [2023-05-13 01:00:09,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:09,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +14: [2023-05-13 01:00:09,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +14: [2023-05-13 01:00:09,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +11: [2023-05-13 01:00:09,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +21: [2023-05-13 01:00:09,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +30: [2023-05-13 01:00:09,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +29: [2023-05-13 01:00:09,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +29: [2023-05-13 01:00:09,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +30: [2023-05-13 01:00:09,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +21: [2023-05-13 01:00:09,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +30: [2023-05-13 01:00:09,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +29: [2023-05-13 01:00:09,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +30: [2023-05-13 01:00:09,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +30: [2023-05-13 01:00:09,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +26: [2023-05-13 01:00:09,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +21: [2023-05-13 01:00:09,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +16: [2023-05-13 01:00:09,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +16: [2023-05-13 01:00:09,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +29: [2023-05-13 01:00:09,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +16: [2023-05-13 01:00:09,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +16: [2023-05-13 01:00:09,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +16: [2023-05-13 01:00:09,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +16: [2023-05-13 01:00:09,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +16: [2023-05-13 01:00:09,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +29: [2023-05-13 01:00:09,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +29: [2023-05-13 01:00:09,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +21: [2023-05-13 01:00:09,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:09,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +14: [2023-05-13 01:00:09,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +19: [2023-05-13 01:00:09,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +17: [2023-05-13 01:00:09,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +17: [2023-05-13 01:00:09,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:09,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +14: [2023-05-13 01:00:09,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +21: [2023-05-13 01:00:09,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +14: [2023-05-13 01:00:09,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +21: [2023-05-13 01:00:09,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +29: [2023-05-13 01:00:09,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +14: [2023-05-13 01:00:09,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +22: [2023-05-13 01:00:09,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +22: [2023-05-13 01:00:09,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +22: [2023-05-13 01:00:09,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +22: [2023-05-13 01:00:09,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +22: [2023-05-13 01:00:09,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +22: [2023-05-13 01:00:09,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +22: [2023-05-13 01:00:09,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +22: [2023-05-13 01:00:09,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +10: [2023-05-13 01:00:09,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +10: [2023-05-13 01:00:09,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +10: [2023-05-13 01:00:09,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +10: [2023-05-13 01:00:09,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +10: [2023-05-13 01:00:09,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +10: [2023-05-13 01:00:09,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +10: [2023-05-13 01:00:09,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +10: [2023-05-13 01:00:09,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +21: [2023-05-13 01:00:09,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +26: [2023-05-13 01:00:09,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +26: [2023-05-13 01:00:09,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +26: [2023-05-13 01:00:09,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +21: [2023-05-13 01:00:09,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +22: [2023-05-13 01:00:09,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +19: [2023-05-13 01:00:09,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +19: [2023-05-13 01:00:09,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +26: [2023-05-13 01:00:09,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +14: [2023-05-13 01:00:09,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +10: [2023-05-13 01:00:09,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +26: [2023-05-13 01:00:09,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +22: [2023-05-13 01:00:09,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +22: [2023-05-13 01:00:09,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +22: [2023-05-13 01:00:09,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +10: [2023-05-13 01:00:09,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +10: [2023-05-13 01:00:09,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +17: [2023-05-13 01:00:09,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +23: [2023-05-13 01:00:09,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +23: [2023-05-13 01:00:09,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +22: [2023-05-13 01:00:09,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +10: [2023-05-13 01:00:09,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +22: [2023-05-13 01:00:09,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +23: [2023-05-13 01:00:09,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +10: [2023-05-13 01:00:09,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:09,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +10: [2023-05-13 01:00:09,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +19: [2023-05-13 01:00:09,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +19: [2023-05-13 01:00:09,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +22: [2023-05-13 01:00:09,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +10: [2023-05-13 01:00:09,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +26: [2023-05-13 01:00:09,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +10: [2023-05-13 01:00:09,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +19: [2023-05-13 01:00:09,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +23: [2023-05-13 01:00:09,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +23: [2023-05-13 01:00:09,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +23: [2023-05-13 01:00:09,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +23: [2023-05-13 01:00:09,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +22: [2023-05-13 01:00:09,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +23: [2023-05-13 01:00:09,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +23: [2023-05-13 01:00:09,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +23: [2023-05-13 01:00:09,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +28: [2023-05-13 01:00:09,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +23: [2023-05-13 01:00:09,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +15: [2023-05-13 01:00:09,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +23: [2023-05-13 01:00:09,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +23: [2023-05-13 01:00:09,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +23: [2023-05-13 01:00:09,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +23: [2023-05-13 01:00:09,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +21: [2023-05-13 01:00:09,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:09,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +15: [2023-05-13 01:00:09,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +23: [2023-05-13 01:00:09,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +15: [2023-05-13 01:00:09,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +15: [2023-05-13 01:00:09,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +17: [2023-05-13 01:00:09,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:09,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +15: [2023-05-13 01:00:09,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 5: [2023-05-13 01:00:09,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:09,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 5: [2023-05-13 01:00:09,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +21: [2023-05-13 01:00:09,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +21: [2023-05-13 01:00:09,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:09,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +17: [2023-05-13 01:00:09,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +17: [2023-05-13 01:00:09,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +17: [2023-05-13 01:00:09,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +17: [2023-05-13 01:00:09,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +17: [2023-05-13 01:00:09,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +28: [2023-05-13 01:00:09,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +28: [2023-05-13 01:00:09,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +28: [2023-05-13 01:00:09,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +30: [2023-05-13 01:00:09,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +15: [2023-05-13 01:00:09,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 4: [2023-05-13 01:00:09,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:09,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +28: [2023-05-13 01:00:09,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 4: [2023-05-13 01:00:09,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +17: [2023-05-13 01:00:09,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +19: [2023-05-13 01:00:09,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +30: [2023-05-13 01:00:09,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +30: [2023-05-13 01:00:09,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +19: [2023-05-13 01:00:09,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +26: [2023-05-13 01:00:09,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +26: [2023-05-13 01:00:09,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +19: [2023-05-13 01:00:09,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:09,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +26: [2023-05-13 01:00:09,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:09,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +19: [2023-05-13 01:00:09,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +19: [2023-05-13 01:00:09,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +19: [2023-05-13 01:00:09,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +19: [2023-05-13 01:00:09,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +22: [2023-05-13 01:00:09,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +30: [2023-05-13 01:00:09,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:09,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +15: [2023-05-13 01:00:09,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +17: [2023-05-13 01:00:09,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +17: [2023-05-13 01:00:09,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +17: [2023-05-13 01:00:09,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +10: [2023-05-13 01:00:09,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +28: [2023-05-13 01:00:09,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:09,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +30: [2023-05-13 01:00:09,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:09,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:09,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:09,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +18: [2023-05-13 01:00:09,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +18: [2023-05-13 01:00:09,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +30: [2023-05-13 01:00:09,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +17: [2023-05-13 01:00:09,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +17: [2023-05-13 01:00:09,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +18: [2023-05-13 01:00:09,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +23: [2023-05-13 01:00:09,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +23: [2023-05-13 01:00:09,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +18: [2023-05-13 01:00:09,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +18: [2023-05-13 01:00:09,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +18: [2023-05-13 01:00:09,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +18: [2023-05-13 01:00:09,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +18: [2023-05-13 01:00:09,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +30: [2023-05-13 01:00:09,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +30: [2023-05-13 01:00:09,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +30: [2023-05-13 01:00:09,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +30: [2023-05-13 01:00:09,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +30: [2023-05-13 01:00:09,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +10: [2023-05-13 01:00:09,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +18: [2023-05-13 01:00:09,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +18: [2023-05-13 01:00:09,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +18: [2023-05-13 01:00:09,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +18: [2023-05-13 01:00:09,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +22: [2023-05-13 01:00:09,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +10: [2023-05-13 01:00:09,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +10: [2023-05-13 01:00:09,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +15: [2023-05-13 01:00:09,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +22: [2023-05-13 01:00:09,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +22: [2023-05-13 01:00:09,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +18: [2023-05-13 01:00:09,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +18: [2023-05-13 01:00:09,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +18: [2023-05-13 01:00:09,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +18: [2023-05-13 01:00:09,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +19: [2023-05-13 01:00:09,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +22: [2023-05-13 01:00:09,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +10: [2023-05-13 01:00:09,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +10: [2023-05-13 01:00:09,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +10: [2023-05-13 01:00:09,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +22: [2023-05-13 01:00:09,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +22: [2023-05-13 01:00:09,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +23: [2023-05-13 01:00:09,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +15: [2023-05-13 01:00:09,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +10: [2023-05-13 01:00:09,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +23: [2023-05-13 01:00:09,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +23: [2023-05-13 01:00:09,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +10: [2023-05-13 01:00:09,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +23: [2023-05-13 01:00:09,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +15: [2023-05-13 01:00:09,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +10: [2023-05-13 01:00:09,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:09,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +10: [2023-05-13 01:00:09,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:09,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +22: [2023-05-13 01:00:09,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +22: [2023-05-13 01:00:09,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +30: [2023-05-13 01:00:09,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +30: [2023-05-13 01:00:09,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +30: [2023-05-13 01:00:09,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +10: [2023-05-13 01:00:09,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +22: [2023-05-13 01:00:09,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +22: [2023-05-13 01:00:09,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +22: [2023-05-13 01:00:09,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +30: [2023-05-13 01:00:09,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +30: [2023-05-13 01:00:09,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +10: [2023-05-13 01:00:09,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +10: [2023-05-13 01:00:09,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +10: [2023-05-13 01:00:09,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +22: [2023-05-13 01:00:09,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +22: [2023-05-13 01:00:09,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +23: [2023-05-13 01:00:09,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +23: [2023-05-13 01:00:09,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +23: [2023-05-13 01:00:09,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +23: [2023-05-13 01:00:09,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +15: [2023-05-13 01:00:09,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +10: [2023-05-13 01:00:09,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +15: [2023-05-13 01:00:09,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 3: [2023-05-13 01:00:09,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +23: [2023-05-13 01:00:09,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:09,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +15: [2023-05-13 01:00:09,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +23: [2023-05-13 01:00:09,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +18: [2023-05-13 01:00:09,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +18: [2023-05-13 01:00:09,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +22: [2023-05-13 01:00:09,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +31: [2023-05-13 01:00:09,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:09,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +18: [2023-05-13 01:00:09,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +31: [2023-05-13 01:00:09,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:09,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:09,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:09,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:09,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +18: [2023-05-13 01:00:09,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +31: [2023-05-13 01:00:09,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:09,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +31: [2023-05-13 01:00:09,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +31: [2023-05-13 01:00:09,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +31: [2023-05-13 01:00:09,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +22: [2023-05-13 01:00:09,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +31: [2023-05-13 01:00:09,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +31: [2023-05-13 01:00:09,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +31: [2023-05-13 01:00:09,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +31: [2023-05-13 01:00:09,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +23: [2023-05-13 01:00:09,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +23: [2023-05-13 01:00:09,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +18: [2023-05-13 01:00:09,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +18: [2023-05-13 01:00:09,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +23: [2023-05-13 01:00:09,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +23: [2023-05-13 01:00:09,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +15: [2023-05-13 01:00:09,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +18: [2023-05-13 01:00:09,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +18: [2023-05-13 01:00:09,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +18: [2023-05-13 01:00:09,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +18: [2023-05-13 01:00:09,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +12: [2023-05-13 01:00:09,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +12: [2023-05-13 01:00:09,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +12: [2023-05-13 01:00:09,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +25: [2023-05-13 01:00:09,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +25: [2023-05-13 01:00:09,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +12: [2023-05-13 01:00:09,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +12: [2023-05-13 01:00:09,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +12: [2023-05-13 01:00:09,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +12: [2023-05-13 01:00:09,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +25: [2023-05-13 01:00:09,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +12: [2023-05-13 01:00:09,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +25: [2023-05-13 01:00:09,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +25: [2023-05-13 01:00:09,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +25: [2023-05-13 01:00:09,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +25: [2023-05-13 01:00:09,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +25: [2023-05-13 01:00:09,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +25: [2023-05-13 01:00:09,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +12: [2023-05-13 01:00:09,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +18: [2023-05-13 01:00:09,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +18: [2023-05-13 01:00:09,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +25: [2023-05-13 01:00:09,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +24: [2023-05-13 01:00:09,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +24: [2023-05-13 01:00:09,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +12: [2023-05-13 01:00:09,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +25: [2023-05-13 01:00:09,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +25: [2023-05-13 01:00:09,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +12: [2023-05-13 01:00:09,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +12: [2023-05-13 01:00:09,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +24: [2023-05-13 01:00:09,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +25: [2023-05-13 01:00:09,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +27: [2023-05-13 01:00:09,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:09,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:09,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:09,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:09,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:09,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:09,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +25: [2023-05-13 01:00:09,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +12: [2023-05-13 01:00:09,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +25: [2023-05-13 01:00:09,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +27: [2023-05-13 01:00:09,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +12: [2023-05-13 01:00:09,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +25: [2023-05-13 01:00:09,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +12: [2023-05-13 01:00:09,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +12: [2023-05-13 01:00:09,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +24: [2023-05-13 01:00:09,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +24: [2023-05-13 01:00:09,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +24: [2023-05-13 01:00:09,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +20: [2023-05-13 01:00:09,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +20: [2023-05-13 01:00:09,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +20: [2023-05-13 01:00:09,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +20: [2023-05-13 01:00:09,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +20: [2023-05-13 01:00:09,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +24: [2023-05-13 01:00:09,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +27: [2023-05-13 01:00:09,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +24: [2023-05-13 01:00:09,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +20: [2023-05-13 01:00:09,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +20: [2023-05-13 01:00:09,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +18: [2023-05-13 01:00:09,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +24: [2023-05-13 01:00:09,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +24: [2023-05-13 01:00:09,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +27: [2023-05-13 01:00:09,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +20: [2023-05-13 01:00:09,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +27: [2023-05-13 01:00:09,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:09,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:09,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 0: [2023-05-13 01:00:09,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +27: [2023-05-13 01:00:09,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +27: [2023-05-13 01:00:09,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +27: [2023-05-13 01:00:09,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 8: [2023-05-13 01:00:09,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 8: [2023-05-13 01:00:09,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +20: [2023-05-13 01:00:09,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +18: [2023-05-13 01:00:09,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +24: [2023-05-13 01:00:09,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +18: [2023-05-13 01:00:09,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +18: [2023-05-13 01:00:09,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +24: [2023-05-13 01:00:09,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +24: [2023-05-13 01:00:09,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +20: [2023-05-13 01:00:09,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 0: [2023-05-13 01:00:09,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +24: [2023-05-13 01:00:09,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +24: [2023-05-13 01:00:09,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +20: [2023-05-13 01:00:09,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +24: [2023-05-13 01:00:09,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +20: [2023-05-13 01:00:09,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +20: [2023-05-13 01:00:09,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +20: [2023-05-13 01:00:09,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +20: [2023-05-13 01:00:09,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +20: [2023-05-13 01:00:09,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +31: [2023-05-13 01:00:09,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:09,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:09,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:09,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:09,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:09,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:09,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:09,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:09,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:09,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:09,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +24: [2023-05-13 01:00:09,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 9: [2023-05-13 01:00:09,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +11: [2023-05-13 01:00:09,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +11: [2023-05-13 01:00:09,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +11: [2023-05-13 01:00:09,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +31: [2023-05-13 01:00:09,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:09,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:09,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +11: [2023-05-13 01:00:09,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +11: [2023-05-13 01:00:09,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +31: [2023-05-13 01:00:09,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:09,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +31: [2023-05-13 01:00:09,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:09,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 9: [2023-05-13 01:00:09,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 2: [2023-05-13 01:00:09,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 2: [2023-05-13 01:00:09,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +13: [2023-05-13 01:00:09,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +13: [2023-05-13 01:00:09,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +13: [2023-05-13 01:00:09,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 1: [2023-05-13 01:00:09,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 1: [2023-05-13 01:00:09,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +13: [2023-05-13 01:00:10,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +31: [2023-05-13 01:00:10,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +29: [2023-05-13 01:00:10,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +29: [2023-05-13 01:00:10,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +29: [2023-05-13 01:00:10,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +29: [2023-05-13 01:00:10,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +29: [2023-05-13 01:00:10,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +29: [2023-05-13 01:00:10,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +29: [2023-05-13 01:00:10,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +13: [2023-05-13 01:00:10,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:10,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +13: [2023-05-13 01:00:10,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +13: [2023-05-13 01:00:10,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +13: [2023-05-13 01:00:10,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +13: [2023-05-13 01:00:10,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +13: [2023-05-13 01:00:10,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +25: [2023-05-13 01:00:10,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +25: [2023-05-13 01:00:10,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +12: [2023-05-13 01:00:10,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:10,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +31: [2023-05-13 01:00:10,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:10,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +13: [2023-05-13 01:00:10,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +29: [2023-05-13 01:00:10,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +29: [2023-05-13 01:00:10,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +29: [2023-05-13 01:00:10,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +29: [2023-05-13 01:00:10,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +31: [2023-05-13 01:00:10,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +29: [2023-05-13 01:00:10,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +24: [2023-05-13 01:00:10,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +13: [2023-05-13 01:00:10,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +13: [2023-05-13 01:00:10,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +13: [2023-05-13 01:00:10,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... +13: [2023-05-13 01:00:10,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +13: [2023-05-13 01:00:10,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +31: [2023-05-13 01:00:10,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +31: [2023-05-13 01:00:10,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +31: [2023-05-13 01:00:10,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +31: [2023-05-13 01:00:10,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +31: [2023-05-13 01:00:10,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +20: [2023-05-13 01:00:10,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +31: [2023-05-13 01:00:10,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +27: [2023-05-13 01:00:10,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +25: [2023-05-13 01:00:10,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +25: [2023-05-13 01:00:10,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +24: [2023-05-13 01:00:10,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:10,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +12: [2023-05-13 01:00:10,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +27: [2023-05-13 01:00:10,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:10,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +12: [2023-05-13 01:00:10,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +12: [2023-05-13 01:00:10,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +25: [2023-05-13 01:00:10,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +27: [2023-05-13 01:00:10,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:10,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:10,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:10,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +25: [2023-05-13 01:00:10,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +13: [2023-05-13 01:00:10,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +24: [2023-05-13 01:00:10,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +27: [2023-05-13 01:00:10,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +13: [2023-05-13 01:00:10,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:10,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +20: [2023-05-13 01:00:10,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +14: [2023-05-13 01:00:10,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +14: [2023-05-13 01:00:10,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +14: [2023-05-13 01:00:10,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +14: [2023-05-13 01:00:10,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +14: [2023-05-13 01:00:10,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +14: [2023-05-13 01:00:10,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +14: [2023-05-13 01:00:10,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +14: [2023-05-13 01:00:10,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +16: [2023-05-13 01:00:10,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:10,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +16: [2023-05-13 01:00:10,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +16: [2023-05-13 01:00:10,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:10,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +16: [2023-05-13 01:00:10,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +16: [2023-05-13 01:00:10,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +16: [2023-05-13 01:00:10,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +16: [2023-05-13 01:00:10,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +24: [2023-05-13 01:00:10,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +16: [2023-05-13 01:00:10,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +25: [2023-05-13 01:00:10,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +14: [2023-05-13 01:00:10,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +16: [2023-05-13 01:00:10,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +14: [2023-05-13 01:00:10,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +14: [2023-05-13 01:00:10,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +14: [2023-05-13 01:00:10,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +14: [2023-05-13 01:00:10,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +25: [2023-05-13 01:00:10,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +25: [2023-05-13 01:00:10,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +25: [2023-05-13 01:00:10,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +16: [2023-05-13 01:00:10,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +25: [2023-05-13 01:00:10,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +24: [2023-05-13 01:00:10,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +14: [2023-05-13 01:00:10,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +24: [2023-05-13 01:00:10,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +14: [2023-05-13 01:00:10,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +14: [2023-05-13 01:00:10,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +27: [2023-05-13 01:00:10,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +11: [2023-05-13 01:00:10,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +27: [2023-05-13 01:00:10,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:10,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +16: [2023-05-13 01:00:10,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +12: [2023-05-13 01:00:10,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +12: [2023-05-13 01:00:10,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +12: [2023-05-13 01:00:10,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +12: [2023-05-13 01:00:10,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +12: [2023-05-13 01:00:10,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +12: [2023-05-13 01:00:10,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +12: [2023-05-13 01:00:10,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +16: [2023-05-13 01:00:10,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +24: [2023-05-13 01:00:10,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +24: [2023-05-13 01:00:10,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +16: [2023-05-13 01:00:10,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +24: [2023-05-13 01:00:10,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +16: [2023-05-13 01:00:10,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +11: [2023-05-13 01:00:10,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:10,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:10,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +16: [2023-05-13 01:00:10,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +16: [2023-05-13 01:00:10,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +20: [2023-05-13 01:00:10,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +20: [2023-05-13 01:00:10,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +20: [2023-05-13 01:00:10,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +20: [2023-05-13 01:00:10,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +20: [2023-05-13 01:00:10,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +20: [2023-05-13 01:00:10,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:10,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +27: [2023-05-13 01:00:10,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +27: [2023-05-13 01:00:10,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +27: [2023-05-13 01:00:10,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +25: [2023-05-13 01:00:10,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +29: [2023-05-13 01:00:10,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +24: [2023-05-13 01:00:10,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +13: [2023-05-13 01:00:10,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +13: [2023-05-13 01:00:10,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +20: [2023-05-13 01:00:10,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +13: [2023-05-13 01:00:10,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:10,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +27: [2023-05-13 01:00:10,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +29: [2023-05-13 01:00:10,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +29: [2023-05-13 01:00:10,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +11: [2023-05-13 01:00:10,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +29: [2023-05-13 01:00:10,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +29: [2023-05-13 01:00:10,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +29: [2023-05-13 01:00:10,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +29: [2023-05-13 01:00:10,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +25: [2023-05-13 01:00:10,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +25: [2023-05-13 01:00:10,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +25: [2023-05-13 01:00:10,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +11: [2023-05-13 01:00:10,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +24: [2023-05-13 01:00:10,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +13: [2023-05-13 01:00:10,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +13: [2023-05-13 01:00:10,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +13: [2023-05-13 01:00:10,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +13: [2023-05-13 01:00:10,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +11: [2023-05-13 01:00:10,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +12: [2023-05-13 01:00:10,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +24: [2023-05-13 01:00:10,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +12: [2023-05-13 01:00:10,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +12: [2023-05-13 01:00:10,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +12: [2023-05-13 01:00:10,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +13: [2023-05-13 01:00:10,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +12: [2023-05-13 01:00:10,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +25: [2023-05-13 01:00:10,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +13: [2023-05-13 01:00:10,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +11: [2023-05-13 01:00:10,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +11: [2023-05-13 01:00:10,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +11: [2023-05-13 01:00:10,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +24: [2023-05-13 01:00:10,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +20: [2023-05-13 01:00:10,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +24: [2023-05-13 01:00:10,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +24: [2023-05-13 01:00:10,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +20: [2023-05-13 01:00:10,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +20: [2023-05-13 01:00:10,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +16: [2023-05-13 01:00:10,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_16-model_00-model_states.pt. +29: [2023-05-13 01:00:10,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +20: [2023-05-13 01:00:10,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +20: [2023-05-13 01:00:10,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +20: [2023-05-13 01:00:10,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +26: [2023-05-13 01:00:10,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +26: [2023-05-13 01:00:10,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +20: [2023-05-13 01:00:10,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +26: [2023-05-13 01:00:10,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +29: [2023-05-13 01:00:10,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +26: [2023-05-13 01:00:10,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +29: [2023-05-13 01:00:10,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +26: [2023-05-13 01:00:10,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +26: [2023-05-13 01:00:10,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +26: [2023-05-13 01:00:10,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +26: [2023-05-13 01:00:10,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +26: [2023-05-13 01:00:10,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +29: [2023-05-13 01:00:10,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +26: [2023-05-13 01:00:10,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +11: [2023-05-13 01:00:10,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +14: [2023-05-13 01:00:10,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +13: [2023-05-13 01:00:10,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +13: [2023-05-13 01:00:10,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +14: [2023-05-13 01:00:10,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +13: [2023-05-13 01:00:10,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +26: [2023-05-13 01:00:10,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +13: [2023-05-13 01:00:10,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +26: [2023-05-13 01:00:10,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +14: [2023-05-13 01:00:10,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +14: [2023-05-13 01:00:10,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +26: [2023-05-13 01:00:10,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +14: [2023-05-13 01:00:10,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +26: [2023-05-13 01:00:10,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +26: [2023-05-13 01:00:10,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +26: [2023-05-13 01:00:10,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +13: [2023-05-13 01:00:10,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +16: [2023-05-13 01:00:10,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +16: [2023-05-13 01:00:10,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +14: [2023-05-13 01:00:10,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +14: [2023-05-13 01:00:10,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +14: [2023-05-13 01:00:10,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +14: [2023-05-13 01:00:10,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +21: [2023-05-13 01:00:10,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +21: [2023-05-13 01:00:10,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +21: [2023-05-13 01:00:10,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +21: [2023-05-13 01:00:10,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +21: [2023-05-13 01:00:10,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +21: [2023-05-13 01:00:10,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +21: [2023-05-13 01:00:10,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +21: [2023-05-13 01:00:10,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +21: [2023-05-13 01:00:10,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +21: [2023-05-13 01:00:10,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +21: [2023-05-13 01:00:10,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +14: [2023-05-13 01:00:10,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +21: [2023-05-13 01:00:10,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +21: [2023-05-13 01:00:10,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +14: [2023-05-13 01:00:10,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +21: [2023-05-13 01:00:10,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +21: [2023-05-13 01:00:10,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +21: [2023-05-13 01:00:10,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +16: [2023-05-13 01:00:10,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +16: [2023-05-13 01:00:10,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +16: [2023-05-13 01:00:10,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +26: [2023-05-13 01:00:10,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +16: [2023-05-13 01:00:10,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +16: [2023-05-13 01:00:10,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +16: [2023-05-13 01:00:10,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +22: [2023-05-13 01:00:10,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +22: [2023-05-13 01:00:10,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +14: [2023-05-13 01:00:10,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +14: [2023-05-13 01:00:10,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +22: [2023-05-13 01:00:10,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +22: [2023-05-13 01:00:10,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +22: [2023-05-13 01:00:10,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +22: [2023-05-13 01:00:10,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +22: [2023-05-13 01:00:10,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +22: [2023-05-13 01:00:10,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +16: [2023-05-13 01:00:10,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +22: [2023-05-13 01:00:10,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +22: [2023-05-13 01:00:10,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +22: [2023-05-13 01:00:10,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +22: [2023-05-13 01:00:10,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +22: [2023-05-13 01:00:10,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +22: [2023-05-13 01:00:10,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +22: [2023-05-13 01:00:10,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +22: [2023-05-13 01:00:10,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +14: [2023-05-13 01:00:10,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +14: [2023-05-13 01:00:10,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +14: [2023-05-13 01:00:10,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +26: [2023-05-13 01:00:10,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +26: [2023-05-13 01:00:10,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +10: [2023-05-13 01:00:10,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +10: [2023-05-13 01:00:10,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +10: [2023-05-13 01:00:10,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +10: [2023-05-13 01:00:10,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +10: [2023-05-13 01:00:10,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +10: [2023-05-13 01:00:10,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +10: [2023-05-13 01:00:10,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +10: [2023-05-13 01:00:10,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +10: [2023-05-13 01:00:10,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +10: [2023-05-13 01:00:10,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +10: [2023-05-13 01:00:10,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +10: [2023-05-13 01:00:10,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +10: [2023-05-13 01:00:10,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +10: [2023-05-13 01:00:10,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +16: [2023-05-13 01:00:10,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +10: [2023-05-13 01:00:10,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +16: [2023-05-13 01:00:10,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +10: [2023-05-13 01:00:10,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +16: [2023-05-13 01:00:10,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +16: [2023-05-13 01:00:10,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +16: [2023-05-13 01:00:10,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +16: [2023-05-13 01:00:10,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +21: [2023-05-13 01:00:10,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +26: [2023-05-13 01:00:10,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +28: [2023-05-13 01:00:10,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +28: [2023-05-13 01:00:10,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +28: [2023-05-13 01:00:10,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +28: [2023-05-13 01:00:10,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +28: [2023-05-13 01:00:10,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +28: [2023-05-13 01:00:10,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +28: [2023-05-13 01:00:10,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +26: [2023-05-13 01:00:10,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +28: [2023-05-13 01:00:10,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +26: [2023-05-13 01:00:10,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +26: [2023-05-13 01:00:10,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +26: [2023-05-13 01:00:10,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +26: [2023-05-13 01:00:10,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +26: [2023-05-13 01:00:10,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +21: [2023-05-13 01:00:10,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +28: [2023-05-13 01:00:10,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:10,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:10,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:10,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:10,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +28: [2023-05-13 01:00:10,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:10,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:10,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +21: [2023-05-13 01:00:10,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +21: [2023-05-13 01:00:10,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +21: [2023-05-13 01:00:10,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +21: [2023-05-13 01:00:10,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +22: [2023-05-13 01:00:10,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +22: [2023-05-13 01:00:10,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +21: [2023-05-13 01:00:10,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +26: [2023-05-13 01:00:10,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +21: [2023-05-13 01:00:10,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +22: [2023-05-13 01:00:10,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +21: [2023-05-13 01:00:10,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +22: [2023-05-13 01:00:10,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +22: [2023-05-13 01:00:10,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +10: [2023-05-13 01:00:10,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +21: [2023-05-13 01:00:10,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +22: [2023-05-13 01:00:10,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +22: [2023-05-13 01:00:10,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +26: [2023-05-13 01:00:10,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +26: [2023-05-13 01:00:10,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +22: [2023-05-13 01:00:10,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +21: [2023-05-13 01:00:10,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +22: [2023-05-13 01:00:10,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +22: [2023-05-13 01:00:10,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +21: [2023-05-13 01:00:10,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +21: [2023-05-13 01:00:10,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +21: [2023-05-13 01:00:10,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +22: [2023-05-13 01:00:10,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +10: [2023-05-13 01:00:10,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +22: [2023-05-13 01:00:10,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +17: [2023-05-13 01:00:10,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +17: [2023-05-13 01:00:10,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +17: [2023-05-13 01:00:10,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +17: [2023-05-13 01:00:10,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +17: [2023-05-13 01:00:10,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +17: [2023-05-13 01:00:10,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +17: [2023-05-13 01:00:10,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +21: [2023-05-13 01:00:10,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +17: [2023-05-13 01:00:10,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +21: [2023-05-13 01:00:10,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +10: [2023-05-13 01:00:10,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +10: [2023-05-13 01:00:10,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +10: [2023-05-13 01:00:10,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +10: [2023-05-13 01:00:10,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +17: [2023-05-13 01:00:10,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +18: [2023-05-13 01:00:10,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +18: [2023-05-13 01:00:10,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +17: [2023-05-13 01:00:10,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +18: [2023-05-13 01:00:10,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +18: [2023-05-13 01:00:10,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +17: [2023-05-13 01:00:10,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +18: [2023-05-13 01:00:10,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +18: [2023-05-13 01:00:10,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +18: [2023-05-13 01:00:10,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +18: [2023-05-13 01:00:10,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +18: [2023-05-13 01:00:10,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +10: [2023-05-13 01:00:10,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +10: [2023-05-13 01:00:10,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +17: [2023-05-13 01:00:10,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +17: [2023-05-13 01:00:10,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +18: [2023-05-13 01:00:10,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +17: [2023-05-13 01:00:10,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +17: [2023-05-13 01:00:10,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +17: [2023-05-13 01:00:10,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +23: [2023-05-13 01:00:10,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +23: [2023-05-13 01:00:10,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +23: [2023-05-13 01:00:10,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +18: [2023-05-13 01:00:10,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +22: [2023-05-13 01:00:10,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +23: [2023-05-13 01:00:10,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +23: [2023-05-13 01:00:10,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +23: [2023-05-13 01:00:10,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +23: [2023-05-13 01:00:10,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +23: [2023-05-13 01:00:10,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +23: [2023-05-13 01:00:10,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +18: [2023-05-13 01:00:10,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +30: [2023-05-13 01:00:10,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +23: [2023-05-13 01:00:10,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +18: [2023-05-13 01:00:10,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +18: [2023-05-13 01:00:10,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +15: [2023-05-13 01:00:10,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +15: [2023-05-13 01:00:10,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +18: [2023-05-13 01:00:10,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +30: [2023-05-13 01:00:10,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +18: [2023-05-13 01:00:10,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +15: [2023-05-13 01:00:10,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +15: [2023-05-13 01:00:10,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +15: [2023-05-13 01:00:10,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +15: [2023-05-13 01:00:10,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +15: [2023-05-13 01:00:10,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +22: [2023-05-13 01:00:10,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +15: [2023-05-13 01:00:10,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +23: [2023-05-13 01:00:10,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:10,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +30: [2023-05-13 01:00:10,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +10: [2023-05-13 01:00:10,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +30: [2023-05-13 01:00:10,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +22: [2023-05-13 01:00:10,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +30: [2023-05-13 01:00:10,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +30: [2023-05-13 01:00:10,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +30: [2023-05-13 01:00:10,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +30: [2023-05-13 01:00:10,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +30: [2023-05-13 01:00:10,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +30: [2023-05-13 01:00:10,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +23: [2023-05-13 01:00:10,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +23: [2023-05-13 01:00:10,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +15: [2023-05-13 01:00:10,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +22: [2023-05-13 01:00:10,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +23: [2023-05-13 01:00:10,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +15: [2023-05-13 01:00:10,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +15: [2023-05-13 01:00:10,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +15: [2023-05-13 01:00:10,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +23: [2023-05-13 01:00:10,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +15: [2023-05-13 01:00:10,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:10,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +28: [2023-05-13 01:00:10,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +28: [2023-05-13 01:00:10,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +28: [2023-05-13 01:00:10,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +23: [2023-05-13 01:00:10,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +15: [2023-05-13 01:00:10,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +15: [2023-05-13 01:00:10,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:10,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +28: [2023-05-13 01:00:10,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +28: [2023-05-13 01:00:10,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +15: [2023-05-13 01:00:10,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +10: [2023-05-13 01:00:10,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +30: [2023-05-13 01:00:10,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +30: [2023-05-13 01:00:10,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +30: [2023-05-13 01:00:10,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +30: [2023-05-13 01:00:10,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +30: [2023-05-13 01:00:10,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +30: [2023-05-13 01:00:10,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +10: [2023-05-13 01:00:10,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +10: [2023-05-13 01:00:10,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +19: [2023-05-13 01:00:10,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +19: [2023-05-13 01:00:10,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +19: [2023-05-13 01:00:10,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +19: [2023-05-13 01:00:10,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +19: [2023-05-13 01:00:10,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +19: [2023-05-13 01:00:10,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +19: [2023-05-13 01:00:10,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +10: [2023-05-13 01:00:10,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +19: [2023-05-13 01:00:10,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +10: [2023-05-13 01:00:10,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +10: [2023-05-13 01:00:10,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +19: [2023-05-13 01:00:10,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +17: [2023-05-13 01:00:10,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +19: [2023-05-13 01:00:10,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +19: [2023-05-13 01:00:10,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +19: [2023-05-13 01:00:10,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +19: [2023-05-13 01:00:10,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +10: [2023-05-13 01:00:10,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +19: [2023-05-13 01:00:10,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +19: [2023-05-13 01:00:10,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +19: [2023-05-13 01:00:10,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +28: [2023-05-13 01:00:10,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +28: [2023-05-13 01:00:10,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +28: [2023-05-13 01:00:10,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +18: [2023-05-13 01:00:10,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +23: [2023-05-13 01:00:10,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +28: [2023-05-13 01:00:10,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +28: [2023-05-13 01:00:10,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +24: [2023-05-13 01:00:10,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +24: [2023-05-13 01:00:10,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +24: [2023-05-13 01:00:10,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +24: [2023-05-13 01:00:10,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +28: [2023-05-13 01:00:10,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +24: [2023-05-13 01:00:10,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +28: [2023-05-13 01:00:10,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +24: [2023-05-13 01:00:10,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +24: [2023-05-13 01:00:10,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +24: [2023-05-13 01:00:10,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +28: [2023-05-13 01:00:10,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +30: [2023-05-13 01:00:10,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +24: [2023-05-13 01:00:10,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +27: [2023-05-13 01:00:10,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +27: [2023-05-13 01:00:10,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +27: [2023-05-13 01:00:10,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +27: [2023-05-13 01:00:10,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +27: [2023-05-13 01:00:10,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +12: [2023-05-13 01:00:10,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:10,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +27: [2023-05-13 01:00:10,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +12: [2023-05-13 01:00:10,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +12: [2023-05-13 01:00:10,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:10,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +12: [2023-05-13 01:00:10,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +12: [2023-05-13 01:00:10,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +12: [2023-05-13 01:00:10,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +12: [2023-05-13 01:00:10,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +12: [2023-05-13 01:00:10,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +17: [2023-05-13 01:00:10,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +24: [2023-05-13 01:00:10,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +27: [2023-05-13 01:00:10,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +24: [2023-05-13 01:00:10,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +27: [2023-05-13 01:00:10,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +27: [2023-05-13 01:00:10,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +24: [2023-05-13 01:00:10,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +12: [2023-05-13 01:00:10,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +24: [2023-05-13 01:00:10,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +31: [2023-05-13 01:00:10,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +31: [2023-05-13 01:00:10,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +27: [2023-05-13 01:00:10,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +27: [2023-05-13 01:00:10,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +12: [2023-05-13 01:00:10,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +12: [2023-05-13 01:00:10,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:10,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:10,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +17: [2023-05-13 01:00:10,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:10,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +12: [2023-05-13 01:00:10,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +18: [2023-05-13 01:00:10,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:10,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +31: [2023-05-13 01:00:10,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +15: [2023-05-13 01:00:10,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:10,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +31: [2023-05-13 01:00:10,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +31: [2023-05-13 01:00:10,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +31: [2023-05-13 01:00:10,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +23: [2023-05-13 01:00:10,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:10,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +11: [2023-05-13 01:00:10,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +11: [2023-05-13 01:00:10,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +11: [2023-05-13 01:00:10,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +31: [2023-05-13 01:00:10,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +11: [2023-05-13 01:00:10,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +11: [2023-05-13 01:00:10,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +11: [2023-05-13 01:00:10,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +11: [2023-05-13 01:00:10,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +11: [2023-05-13 01:00:10,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +31: [2023-05-13 01:00:10,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +12: [2023-05-13 01:00:10,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +31: [2023-05-13 01:00:10,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +12: [2023-05-13 01:00:10,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +18: [2023-05-13 01:00:10,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +12: [2023-05-13 01:00:10,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +11: [2023-05-13 01:00:10,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +11: [2023-05-13 01:00:10,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +31: [2023-05-13 01:00:10,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +25: [2023-05-13 01:00:10,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +25: [2023-05-13 01:00:10,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +25: [2023-05-13 01:00:10,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +25: [2023-05-13 01:00:10,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +25: [2023-05-13 01:00:10,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +25: [2023-05-13 01:00:10,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +25: [2023-05-13 01:00:10,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +30: [2023-05-13 01:00:10,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:10,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +25: [2023-05-13 01:00:10,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:10,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +11: [2023-05-13 01:00:10,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +31: [2023-05-13 01:00:10,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +11: [2023-05-13 01:00:10,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +31: [2023-05-13 01:00:10,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +11: [2023-05-13 01:00:10,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +25: [2023-05-13 01:00:10,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +25: [2023-05-13 01:00:10,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +11: [2023-05-13 01:00:10,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +20: [2023-05-13 01:00:10,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +20: [2023-05-13 01:00:10,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +20: [2023-05-13 01:00:10,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +20: [2023-05-13 01:00:10,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +20: [2023-05-13 01:00:10,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +20: [2023-05-13 01:00:10,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +20: [2023-05-13 01:00:10,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +20: [2023-05-13 01:00:10,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +15: [2023-05-13 01:00:10,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +25: [2023-05-13 01:00:10,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +11: [2023-05-13 01:00:10,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +18: [2023-05-13 01:00:10,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +25: [2023-05-13 01:00:10,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +25: [2023-05-13 01:00:10,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +23: [2023-05-13 01:00:10,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +20: [2023-05-13 01:00:10,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:10,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +30: [2023-05-13 01:00:10,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +25: [2023-05-13 01:00:10,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +20: [2023-05-13 01:00:10,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +25: [2023-05-13 01:00:10,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +20: [2023-05-13 01:00:10,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +25: [2023-05-13 01:00:10,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +20: [2023-05-13 01:00:10,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +20: [2023-05-13 01:00:10,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +19: [2023-05-13 01:00:10,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +23: [2023-05-13 01:00:10,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +17: [2023-05-13 01:00:10,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +18: [2023-05-13 01:00:10,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +18: [2023-05-13 01:00:10,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +18: [2023-05-13 01:00:10,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +18: [2023-05-13 01:00:10,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +20: [2023-05-13 01:00:10,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +17: [2023-05-13 01:00:10,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +20: [2023-05-13 01:00:10,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +20: [2023-05-13 01:00:10,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +15: [2023-05-13 01:00:10,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +17: [2023-05-13 01:00:10,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +17: [2023-05-13 01:00:10,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +17: [2023-05-13 01:00:10,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +17: [2023-05-13 01:00:10,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +18: [2023-05-13 01:00:10,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +18: [2023-05-13 01:00:10,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:10,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +15: [2023-05-13 01:00:10,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +15: [2023-05-13 01:00:10,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +15: [2023-05-13 01:00:10,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +23: [2023-05-13 01:00:10,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +30: [2023-05-13 01:00:10,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:10,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +18: [2023-05-13 01:00:10,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +29: [2023-05-13 01:00:10,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +29: [2023-05-13 01:00:10,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +29: [2023-05-13 01:00:10,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +29: [2023-05-13 01:00:10,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +29: [2023-05-13 01:00:10,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +29: [2023-05-13 01:00:10,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +29: [2023-05-13 01:00:10,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +29: [2023-05-13 01:00:10,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +23: [2023-05-13 01:00:10,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +23: [2023-05-13 01:00:10,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +23: [2023-05-13 01:00:10,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +23: [2023-05-13 01:00:10,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +29: [2023-05-13 01:00:10,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +30: [2023-05-13 01:00:10,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +30: [2023-05-13 01:00:10,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +30: [2023-05-13 01:00:10,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +30: [2023-05-13 01:00:10,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +15: [2023-05-13 01:00:10,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +30: [2023-05-13 01:00:10,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +29: [2023-05-13 01:00:10,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +19: [2023-05-13 01:00:10,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +23: [2023-05-13 01:00:10,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:10,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +24: [2023-05-13 01:00:10,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +17: [2023-05-13 01:00:10,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +30: [2023-05-13 01:00:10,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +18: [2023-05-13 01:00:10,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:10,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +23: [2023-05-13 01:00:10,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +17: [2023-05-13 01:00:10,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +31: [2023-05-13 01:00:10,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +15: [2023-05-13 01:00:10,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +17: [2023-05-13 01:00:10,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +18: [2023-05-13 01:00:10,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +18: [2023-05-13 01:00:10,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +27: [2023-05-13 01:00:10,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +18: [2023-05-13 01:00:10,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +18: [2023-05-13 01:00:10,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +19: [2023-05-13 01:00:10,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +19: [2023-05-13 01:00:10,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +19: [2023-05-13 01:00:10,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +15: [2023-05-13 01:00:10,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +27: [2023-05-13 01:00:10,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:10,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +17: [2023-05-13 01:00:10,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +17: [2023-05-13 01:00:10,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +27: [2023-05-13 01:00:10,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +27: [2023-05-13 01:00:10,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +27: [2023-05-13 01:00:10,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +27: [2023-05-13 01:00:10,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +27: [2023-05-13 01:00:10,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:10,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +19: [2023-05-13 01:00:10,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +17: [2023-05-13 01:00:10,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +19: [2023-05-13 01:00:10,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +25: [2023-05-13 01:00:10,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +25: [2023-05-13 01:00:10,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +12: [2023-05-13 01:00:10,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:10,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +11: [2023-05-13 01:00:10,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +11: [2023-05-13 01:00:10,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +31: [2023-05-13 01:00:10,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +23: [2023-05-13 01:00:10,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +20: [2023-05-13 01:00:10,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +24: [2023-05-13 01:00:10,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:10,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +11: [2023-05-13 01:00:10,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +31: [2023-05-13 01:00:10,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +31: [2023-05-13 01:00:10,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:10,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +31: [2023-05-13 01:00:10,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +30: [2023-05-13 01:00:10,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +24: [2023-05-13 01:00:10,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +31: [2023-05-13 01:00:10,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +30: [2023-05-13 01:00:10,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +31: [2023-05-13 01:00:10,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +30: [2023-05-13 01:00:10,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +24: [2023-05-13 01:00:10,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +24: [2023-05-13 01:00:10,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +24: [2023-05-13 01:00:10,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +24: [2023-05-13 01:00:10,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:10,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +23: [2023-05-13 01:00:10,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +23: [2023-05-13 01:00:10,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +23: [2023-05-13 01:00:10,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +30: [2023-05-13 01:00:10,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +17: [2023-05-13 01:00:10,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +30: [2023-05-13 01:00:10,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +27: [2023-05-13 01:00:10,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +11: [2023-05-13 01:00:10,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +12: [2023-05-13 01:00:10,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +30: [2023-05-13 01:00:10,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +12: [2023-05-13 01:00:10,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +23: [2023-05-13 01:00:10,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +25: [2023-05-13 01:00:10,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +19: [2023-05-13 01:00:10,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +25: [2023-05-13 01:00:10,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +27: [2023-05-13 01:00:10,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +27: [2023-05-13 01:00:10,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +25: [2023-05-13 01:00:10,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +19: [2023-05-13 01:00:10,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +19: [2023-05-13 01:00:10,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +19: [2023-05-13 01:00:10,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +26: [2023-05-13 01:00:10,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +26: [2023-05-13 01:00:10,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +26: [2023-05-13 01:00:10,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +19: [2023-05-13 01:00:10,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +26: [2023-05-13 01:00:10,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +26: [2023-05-13 01:00:10,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +26: [2023-05-13 01:00:10,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +26: [2023-05-13 01:00:10,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +26: [2023-05-13 01:00:10,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +20: [2023-05-13 01:00:10,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +20: [2023-05-13 01:00:10,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +20: [2023-05-13 01:00:10,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:10,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +12: [2023-05-13 01:00:10,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +27: [2023-05-13 01:00:10,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +27: [2023-05-13 01:00:10,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +19: [2023-05-13 01:00:10,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +27: [2023-05-13 01:00:10,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +19: [2023-05-13 01:00:10,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +26: [2023-05-13 01:00:10,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +24: [2023-05-13 01:00:10,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +14: [2023-05-13 01:00:10,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +14: [2023-05-13 01:00:10,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +14: [2023-05-13 01:00:10,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +14: [2023-05-13 01:00:10,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +14: [2023-05-13 01:00:10,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +14: [2023-05-13 01:00:10,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +14: [2023-05-13 01:00:10,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +14: [2023-05-13 01:00:10,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +26: [2023-05-13 01:00:10,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +31: [2023-05-13 01:00:10,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +29: [2023-05-13 01:00:10,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +11: [2023-05-13 01:00:10,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +20: [2023-05-13 01:00:10,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +14: [2023-05-13 01:00:10,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +14: [2023-05-13 01:00:10,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +26: [2023-05-13 01:00:10,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +27: [2023-05-13 01:00:10,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +31: [2023-05-13 01:00:10,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +14: [2023-05-13 01:00:10,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +11: [2023-05-13 01:00:10,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +11: [2023-05-13 01:00:10,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +31: [2023-05-13 01:00:10,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +14: [2023-05-13 01:00:10,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +27: [2023-05-13 01:00:10,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +14: [2023-05-13 01:00:10,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +26: [2023-05-13 01:00:10,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +14: [2023-05-13 01:00:10,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +14: [2023-05-13 01:00:10,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +14: [2023-05-13 01:00:10,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +11: [2023-05-13 01:00:10,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +16: [2023-05-13 01:00:10,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +16: [2023-05-13 01:00:10,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +16: [2023-05-13 01:00:10,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +16: [2023-05-13 01:00:10,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +16: [2023-05-13 01:00:10,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +16: [2023-05-13 01:00:10,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +16: [2023-05-13 01:00:10,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +31: [2023-05-13 01:00:10,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +31: [2023-05-13 01:00:10,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +16: [2023-05-13 01:00:10,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +31: [2023-05-13 01:00:10,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +11: [2023-05-13 01:00:10,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +25: [2023-05-13 01:00:10,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +25: [2023-05-13 01:00:10,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +12: [2023-05-13 01:00:10,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +11: [2023-05-13 01:00:10,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +25: [2023-05-13 01:00:10,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +25: [2023-05-13 01:00:10,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +27: [2023-05-13 01:00:10,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +24: [2023-05-13 01:00:10,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +31: [2023-05-13 01:00:10,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +24: [2023-05-13 01:00:10,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +24: [2023-05-13 01:00:10,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +16: [2023-05-13 01:00:10,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +20: [2023-05-13 01:00:10,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +12: [2023-05-13 01:00:10,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +29: [2023-05-13 01:00:10,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +11: [2023-05-13 01:00:10,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +16: [2023-05-13 01:00:10,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +16: [2023-05-13 01:00:10,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +12: [2023-05-13 01:00:10,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +12: [2023-05-13 01:00:10,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +12: [2023-05-13 01:00:10,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +16: [2023-05-13 01:00:10,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +16: [2023-05-13 01:00:10,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +16: [2023-05-13 01:00:10,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +16: [2023-05-13 01:00:10,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +16: [2023-05-13 01:00:10,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +12: [2023-05-13 01:00:10,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +25: [2023-05-13 01:00:10,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +19: [2023-05-13 01:00:10,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +19: [2023-05-13 01:00:10,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +20: [2023-05-13 01:00:10,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +20: [2023-05-13 01:00:10,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +29: [2023-05-13 01:00:10,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +20: [2023-05-13 01:00:10,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +20: [2023-05-13 01:00:10,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +11: [2023-05-13 01:00:10,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +11: [2023-05-13 01:00:10,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +20: [2023-05-13 01:00:10,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +20: [2023-05-13 01:00:10,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +24: [2023-05-13 01:00:10,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +29: [2023-05-13 01:00:10,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +25: [2023-05-13 01:00:10,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +12: [2023-05-13 01:00:10,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +20: [2023-05-13 01:00:10,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +29: [2023-05-13 01:00:10,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +14: [2023-05-13 01:00:10,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +12: [2023-05-13 01:00:10,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +12: [2023-05-13 01:00:10,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +29: [2023-05-13 01:00:10,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +26: [2023-05-13 01:00:10,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +26: [2023-05-13 01:00:10,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +14: [2023-05-13 01:00:10,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +14: [2023-05-13 01:00:10,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +20: [2023-05-13 01:00:10,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +20: [2023-05-13 01:00:10,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +20: [2023-05-13 01:00:10,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +29: [2023-05-13 01:00:10,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +14: [2023-05-13 01:00:10,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +14: [2023-05-13 01:00:10,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +14: [2023-05-13 01:00:10,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +14: [2023-05-13 01:00:10,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +16: [2023-05-13 01:00:10,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +14: [2023-05-13 01:00:10,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +26: [2023-05-13 01:00:10,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +26: [2023-05-13 01:00:10,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +26: [2023-05-13 01:00:10,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +26: [2023-05-13 01:00:10,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +26: [2023-05-13 01:00:10,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +14: [2023-05-13 01:00:10,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +14: [2023-05-13 01:00:10,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +14: [2023-05-13 01:00:10,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +16: [2023-05-13 01:00:10,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +16: [2023-05-13 01:00:10,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +16: [2023-05-13 01:00:10,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +16: [2023-05-13 01:00:10,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +16: [2023-05-13 01:00:10,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +16: [2023-05-13 01:00:10,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +16: [2023-05-13 01:00:10,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +14: [2023-05-13 01:00:10,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +16: [2023-05-13 01:00:10,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +28: [2023-05-13 01:00:10,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +28: [2023-05-13 01:00:10,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +28: [2023-05-13 01:00:10,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +28: [2023-05-13 01:00:10,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +28: [2023-05-13 01:00:10,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +28: [2023-05-13 01:00:10,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +28: [2023-05-13 01:00:10,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +28: [2023-05-13 01:00:10,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +14: [2023-05-13 01:00:10,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +14: [2023-05-13 01:00:10,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +14: [2023-05-13 01:00:10,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +28: [2023-05-13 01:00:10,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +28: [2023-05-13 01:00:10,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +28: [2023-05-13 01:00:10,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +28: [2023-05-13 01:00:10,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +28: [2023-05-13 01:00:10,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +14: [2023-05-13 01:00:10,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +28: [2023-05-13 01:00:10,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +28: [2023-05-13 01:00:10,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +26: [2023-05-13 01:00:10,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +28: [2023-05-13 01:00:10,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +26: [2023-05-13 01:00:10,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +16: [2023-05-13 01:00:10,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +16: [2023-05-13 01:00:10,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +16: [2023-05-13 01:00:10,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +16: [2023-05-13 01:00:10,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +16: [2023-05-13 01:00:10,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +16: [2023-05-13 01:00:10,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +16: [2023-05-13 01:00:10,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +30: [2023-05-13 01:00:10,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +30: [2023-05-13 01:00:10,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +30: [2023-05-13 01:00:10,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +30: [2023-05-13 01:00:10,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +30: [2023-05-13 01:00:10,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +30: [2023-05-13 01:00:10,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +30: [2023-05-13 01:00:10,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +13: [2023-05-13 01:00:10,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +13: [2023-05-13 01:00:10,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +30: [2023-05-13 01:00:10,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +28: [2023-05-13 01:00:10,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +30: [2023-05-13 01:00:10,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +13: [2023-05-13 01:00:10,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +13: [2023-05-13 01:00:10,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +13: [2023-05-13 01:00:10,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +13: [2023-05-13 01:00:10,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +13: [2023-05-13 01:00:10,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +13: [2023-05-13 01:00:10,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +30: [2023-05-13 01:00:10,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +13: [2023-05-13 01:00:10,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +30: [2023-05-13 01:00:10,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +30: [2023-05-13 01:00:10,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +13: [2023-05-13 01:00:10,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +13: [2023-05-13 01:00:10,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +30: [2023-05-13 01:00:10,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +30: [2023-05-13 01:00:10,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +30: [2023-05-13 01:00:10,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +30: [2023-05-13 01:00:10,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +13: [2023-05-13 01:00:10,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +13: [2023-05-13 01:00:10,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +13: [2023-05-13 01:00:10,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +13: [2023-05-13 01:00:10,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... +28: [2023-05-13 01:00:10,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +28: [2023-05-13 01:00:10,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +28: [2023-05-13 01:00:10,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +28: [2023-05-13 01:00:10,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +13: [2023-05-13 01:00:10,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +28: [2023-05-13 01:00:10,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +28: [2023-05-13 01:00:10,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +28: [2023-05-13 01:00:10,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +28: [2023-05-13 01:00:10,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +18: [2023-05-13 01:00:10,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +18: [2023-05-13 01:00:10,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +18: [2023-05-13 01:00:10,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +18: [2023-05-13 01:00:10,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +18: [2023-05-13 01:00:10,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +18: [2023-05-13 01:00:10,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +18: [2023-05-13 01:00:10,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +18: [2023-05-13 01:00:10,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +18: [2023-05-13 01:00:10,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +18: [2023-05-13 01:00:10,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +18: [2023-05-13 01:00:10,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +23: [2023-05-13 01:00:10,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +18: [2023-05-13 01:00:10,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +23: [2023-05-13 01:00:10,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +23: [2023-05-13 01:00:10,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +18: [2023-05-13 01:00:10,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +18: [2023-05-13 01:00:10,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +23: [2023-05-13 01:00:10,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +23: [2023-05-13 01:00:10,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +23: [2023-05-13 01:00:10,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +23: [2023-05-13 01:00:10,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +18: [2023-05-13 01:00:10,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +23: [2023-05-13 01:00:10,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +18: [2023-05-13 01:00:10,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:10,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +15: [2023-05-13 01:00:10,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:10,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +15: [2023-05-13 01:00:10,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:10,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +15: [2023-05-13 01:00:10,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +15: [2023-05-13 01:00:10,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +15: [2023-05-13 01:00:10,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +15: [2023-05-13 01:00:10,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +19: [2023-05-13 01:00:10,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +19: [2023-05-13 01:00:10,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +19: [2023-05-13 01:00:10,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +19: [2023-05-13 01:00:10,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +23: [2023-05-13 01:00:10,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +23: [2023-05-13 01:00:10,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +19: [2023-05-13 01:00:10,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +19: [2023-05-13 01:00:10,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +19: [2023-05-13 01:00:10,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +15: [2023-05-13 01:00:10,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +19: [2023-05-13 01:00:10,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +23: [2023-05-13 01:00:10,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +28: [2023-05-13 01:00:10,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +28: [2023-05-13 01:00:10,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +28: [2023-05-13 01:00:10,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +28: [2023-05-13 01:00:10,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +23: [2023-05-13 01:00:10,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:10,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +19: [2023-05-13 01:00:10,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:10,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +23: [2023-05-13 01:00:10,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +23: [2023-05-13 01:00:10,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +23: [2023-05-13 01:00:10,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +28: [2023-05-13 01:00:10,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +28: [2023-05-13 01:00:10,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +15: [2023-05-13 01:00:10,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +15: [2023-05-13 01:00:10,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +23: [2023-05-13 01:00:10,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:10,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +19: [2023-05-13 01:00:10,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +28: [2023-05-13 01:00:10,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +15: [2023-05-13 01:00:10,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +19: [2023-05-13 01:00:10,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +19: [2023-05-13 01:00:10,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +19: [2023-05-13 01:00:10,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +19: [2023-05-13 01:00:10,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +19: [2023-05-13 01:00:10,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +30: [2023-05-13 01:00:10,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +19: [2023-05-13 01:00:10,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +30: [2023-05-13 01:00:10,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +13: [2023-05-13 01:00:10,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +13: [2023-05-13 01:00:10,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +13: [2023-05-13 01:00:10,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +24: [2023-05-13 01:00:10,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +25: [2023-05-13 01:00:10,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +25: [2023-05-13 01:00:10,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +25: [2023-05-13 01:00:10,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +24: [2023-05-13 01:00:10,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +13: [2023-05-13 01:00:10,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +13: [2023-05-13 01:00:10,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +13: [2023-05-13 01:00:10,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +12: [2023-05-13 01:00:10,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +12: [2023-05-13 01:00:10,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +12: [2023-05-13 01:00:10,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +12: [2023-05-13 01:00:10,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +12: [2023-05-13 01:00:10,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +25: [2023-05-13 01:00:10,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +30: [2023-05-13 01:00:10,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +30: [2023-05-13 01:00:10,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +30: [2023-05-13 01:00:10,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +12: [2023-05-13 01:00:10,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +25: [2023-05-13 01:00:10,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +25: [2023-05-13 01:00:10,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +25: [2023-05-13 01:00:10,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +25: [2023-05-13 01:00:10,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +13: [2023-05-13 01:00:10,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. +24: [2023-05-13 01:00:10,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +30: [2023-05-13 01:00:10,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +13: [2023-05-13 01:00:10,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_17-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +30: [2023-05-13 01:00:10,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +13: [2023-05-13 01:00:10,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +30: [2023-05-13 01:00:10,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +30: [2023-05-13 01:00:10,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +30: [2023-05-13 01:00:10,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +12: [2023-05-13 01:00:10,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +25: [2023-05-13 01:00:10,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +12: [2023-05-13 01:00:10,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +25: [2023-05-13 01:00:10,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +12: [2023-05-13 01:00:10,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +12: [2023-05-13 01:00:10,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +13: [2023-05-13 01:00:10,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +25: [2023-05-13 01:00:10,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +12: [2023-05-13 01:00:10,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +25: [2023-05-13 01:00:10,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +12: [2023-05-13 01:00:10,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +12: [2023-05-13 01:00:10,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +25: [2023-05-13 01:00:10,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +25: [2023-05-13 01:00:10,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:10,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +18: [2023-05-13 01:00:10,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +24: [2023-05-13 01:00:10,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +13: [2023-05-13 01:00:10,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +24: [2023-05-13 01:00:10,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +23: [2023-05-13 01:00:10,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +20: [2023-05-13 01:00:10,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +20: [2023-05-13 01:00:10,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +20: [2023-05-13 01:00:10,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +18: [2023-05-13 01:00:10,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +20: [2023-05-13 01:00:10,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +20: [2023-05-13 01:00:10,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +24: [2023-05-13 01:00:10,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +20: [2023-05-13 01:00:10,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +20: [2023-05-13 01:00:10,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +20: [2023-05-13 01:00:10,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +19: [2023-05-13 01:00:10,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +20: [2023-05-13 01:00:10,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +22: [2023-05-13 01:00:10,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +22: [2023-05-13 01:00:10,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +22: [2023-05-13 01:00:10,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +22: [2023-05-13 01:00:10,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +22: [2023-05-13 01:00:10,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +22: [2023-05-13 01:00:10,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +22: [2023-05-13 01:00:10,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +18: [2023-05-13 01:00:10,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +22: [2023-05-13 01:00:10,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +20: [2023-05-13 01:00:10,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +20: [2023-05-13 01:00:10,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +18: [2023-05-13 01:00:10,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +18: [2023-05-13 01:00:10,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +22: [2023-05-13 01:00:10,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +15: [2023-05-13 01:00:10,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +22: [2023-05-13 01:00:10,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +23: [2023-05-13 01:00:10,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +20: [2023-05-13 01:00:10,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +22: [2023-05-13 01:00:10,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +22: [2023-05-13 01:00:10,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +13: [2023-05-13 01:00:10,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +20: [2023-05-13 01:00:10,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +22: [2023-05-13 01:00:10,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +22: [2023-05-13 01:00:10,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +13: [2023-05-13 01:00:10,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +22: [2023-05-13 01:00:10,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +18: [2023-05-13 01:00:10,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +18: [2023-05-13 01:00:10,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +22: [2023-05-13 01:00:10,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +20: [2023-05-13 01:00:10,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:10,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +15: [2023-05-13 01:00:10,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +20: [2023-05-13 01:00:10,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +30: [2023-05-13 01:00:10,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +20: [2023-05-13 01:00:10,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +13: [2023-05-13 01:00:10,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +13: [2023-05-13 01:00:10,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +23: [2023-05-13 01:00:10,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +30: [2023-05-13 01:00:10,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +13: [2023-05-13 01:00:10,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +30: [2023-05-13 01:00:10,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +30: [2023-05-13 01:00:10,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +23: [2023-05-13 01:00:10,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +24: [2023-05-13 01:00:10,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +15: [2023-05-13 01:00:10,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +18: [2023-05-13 01:00:10,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +30: [2023-05-13 01:00:10,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +30: [2023-05-13 01:00:10,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +19: [2023-05-13 01:00:10,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +18: [2023-05-13 01:00:10,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +18: [2023-05-13 01:00:10,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +18: [2023-05-13 01:00:10,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +23: [2023-05-13 01:00:10,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +15: [2023-05-13 01:00:10,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +19: [2023-05-13 01:00:10,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +15: [2023-05-13 01:00:10,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +23: [2023-05-13 01:00:10,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +23: [2023-05-13 01:00:10,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +23: [2023-05-13 01:00:10,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +23: [2023-05-13 01:00:10,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +23: [2023-05-13 01:00:10,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +15: [2023-05-13 01:00:10,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +15: [2023-05-13 01:00:10,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +15: [2023-05-13 01:00:10,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +19: [2023-05-13 01:00:10,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +19: [2023-05-13 01:00:10,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +19: [2023-05-13 01:00:10,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +15: [2023-05-13 01:00:10,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +18: [2023-05-13 01:00:10,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +15: [2023-05-13 01:00:10,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +18: [2023-05-13 01:00:10,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +23: [2023-05-13 01:00:10,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +24: [2023-05-13 01:00:10,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +18: [2023-05-13 01:00:10,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +25: [2023-05-13 01:00:10,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +18: [2023-05-13 01:00:10,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +20: [2023-05-13 01:00:10,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +25: [2023-05-13 01:00:10,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +19: [2023-05-13 01:00:10,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +19: [2023-05-13 01:00:10,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +19: [2023-05-13 01:00:10,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +18: [2023-05-13 01:00:10,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:10,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +22: [2023-05-13 01:00:10,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +24: [2023-05-13 01:00:10,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +15: [2023-05-13 01:00:10,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +15: [2023-05-13 01:00:10,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +12: [2023-05-13 01:00:10,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +12: [2023-05-13 01:00:10,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +22: [2023-05-13 01:00:10,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +22: [2023-05-13 01:00:10,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +22: [2023-05-13 01:00:10,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +19: [2023-05-13 01:00:10,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +23: [2023-05-13 01:00:10,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +23: [2023-05-13 01:00:10,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +19: [2023-05-13 01:00:10,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +15: [2023-05-13 01:00:10,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +23: [2023-05-13 01:00:10,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +19: [2023-05-13 01:00:10,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +23: [2023-05-13 01:00:10,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +12: [2023-05-13 01:00:10,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +12: [2023-05-13 01:00:10,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +12: [2023-05-13 01:00:10,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +24: [2023-05-13 01:00:10,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +23: [2023-05-13 01:00:10,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +19: [2023-05-13 01:00:10,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +20: [2023-05-13 01:00:10,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +25: [2023-05-13 01:00:10,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +19: [2023-05-13 01:00:10,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +25: [2023-05-13 01:00:10,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +25: [2023-05-13 01:00:10,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +25: [2023-05-13 01:00:10,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +22: [2023-05-13 01:00:10,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +22: [2023-05-13 01:00:10,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +22: [2023-05-13 01:00:10,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +22: [2023-05-13 01:00:10,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +19: [2023-05-13 01:00:10,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +22: [2023-05-13 01:00:10,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +20: [2023-05-13 01:00:10,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +20: [2023-05-13 01:00:10,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +20: [2023-05-13 01:00:10,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +20: [2023-05-13 01:00:10,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +20: [2023-05-13 01:00:10,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +12: [2023-05-13 01:00:10,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +20: [2023-05-13 01:00:10,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +22: [2023-05-13 01:00:10,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +22: [2023-05-13 01:00:10,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +20: [2023-05-13 01:00:10,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +22: [2023-05-13 01:00:10,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +12: [2023-05-13 01:00:10,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +19: [2023-05-13 01:00:10,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +24: [2023-05-13 01:00:10,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +10: [2023-05-13 01:00:10,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +24: [2023-05-13 01:00:10,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +12: [2023-05-13 01:00:10,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +10: [2023-05-13 01:00:10,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +10: [2023-05-13 01:00:10,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +10: [2023-05-13 01:00:10,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +24: [2023-05-13 01:00:10,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +24: [2023-05-13 01:00:10,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +24: [2023-05-13 01:00:10,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +22: [2023-05-13 01:00:10,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +10: [2023-05-13 01:00:10,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +10: [2023-05-13 01:00:10,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +10: [2023-05-13 01:00:10,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +10: [2023-05-13 01:00:10,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +10: [2023-05-13 01:00:10,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +22: [2023-05-13 01:00:10,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +22: [2023-05-13 01:00:10,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +24: [2023-05-13 01:00:10,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +22: [2023-05-13 01:00:10,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +20: [2023-05-13 01:00:10,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +20: [2023-05-13 01:00:10,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +20: [2023-05-13 01:00:10,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +20: [2023-05-13 01:00:10,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +20: [2023-05-13 01:00:10,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +20: [2023-05-13 01:00:10,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +20: [2023-05-13 01:00:10,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +17: [2023-05-13 01:00:10,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +17: [2023-05-13 01:00:10,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +17: [2023-05-13 01:00:10,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +17: [2023-05-13 01:00:10,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +17: [2023-05-13 01:00:10,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +17: [2023-05-13 01:00:10,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +17: [2023-05-13 01:00:10,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +17: [2023-05-13 01:00:10,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +17: [2023-05-13 01:00:10,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +17: [2023-05-13 01:00:10,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +17: [2023-05-13 01:00:10,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +17: [2023-05-13 01:00:10,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +17: [2023-05-13 01:00:10,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +17: [2023-05-13 01:00:10,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +17: [2023-05-13 01:00:10,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +17: [2023-05-13 01:00:10,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +31: [2023-05-13 01:00:10,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +31: [2023-05-13 01:00:10,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +31: [2023-05-13 01:00:10,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +31: [2023-05-13 01:00:10,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +31: [2023-05-13 01:00:10,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +31: [2023-05-13 01:00:10,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +31: [2023-05-13 01:00:10,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +31: [2023-05-13 01:00:10,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +31: [2023-05-13 01:00:10,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +31: [2023-05-13 01:00:10,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +31: [2023-05-13 01:00:10,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +31: [2023-05-13 01:00:10,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +31: [2023-05-13 01:00:10,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +31: [2023-05-13 01:00:10,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +31: [2023-05-13 01:00:10,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +31: [2023-05-13 01:00:10,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +10: [2023-05-13 01:00:10,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +27: [2023-05-13 01:00:10,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +27: [2023-05-13 01:00:10,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +27: [2023-05-13 01:00:10,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +27: [2023-05-13 01:00:10,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +27: [2023-05-13 01:00:10,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +10: [2023-05-13 01:00:10,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +27: [2023-05-13 01:00:10,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +10: [2023-05-13 01:00:10,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +17: [2023-05-13 01:00:10,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +13: [2023-05-13 01:00:10,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +17: [2023-05-13 01:00:10,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +17: [2023-05-13 01:00:10,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +13: [2023-05-13 01:00:10,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +10: [2023-05-13 01:00:10,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +10: [2023-05-13 01:00:10,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:10,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +13: [2023-05-13 01:00:10,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +13: [2023-05-13 01:00:10,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +13: [2023-05-13 01:00:10,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +10: [2023-05-13 01:00:10,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:10,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +13: [2023-05-13 01:00:10,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +13: [2023-05-13 01:00:10,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +10: [2023-05-13 01:00:10,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:10,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +10: [2023-05-13 01:00:10,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:10,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +14: [2023-05-13 01:00:10,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +14: [2023-05-13 01:00:10,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +14: [2023-05-13 01:00:10,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +14: [2023-05-13 01:00:10,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +14: [2023-05-13 01:00:10,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +14: [2023-05-13 01:00:10,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +14: [2023-05-13 01:00:10,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +10: [2023-05-13 01:00:10,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:10,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +13: [2023-05-13 01:00:10,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +14: [2023-05-13 01:00:10,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +14: [2023-05-13 01:00:10,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +14: [2023-05-13 01:00:10,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +14: [2023-05-13 01:00:10,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +14: [2023-05-13 01:00:10,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +13: [2023-05-13 01:00:10,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +13: [2023-05-13 01:00:10,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +13: [2023-05-13 01:00:10,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +14: [2023-05-13 01:00:10,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +14: [2023-05-13 01:00:10,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +14: [2023-05-13 01:00:10,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +13: [2023-05-13 01:00:10,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt... +31: [2023-05-13 01:00:10,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +31: [2023-05-13 01:00:10,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +31: [2023-05-13 01:00:10,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +31: [2023-05-13 01:00:10,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +17: [2023-05-13 01:00:10,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +17: [2023-05-13 01:00:10,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +17: [2023-05-13 01:00:10,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +31: [2023-05-13 01:00:10,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +31: [2023-05-13 01:00:10,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +31: [2023-05-13 01:00:10,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +31: [2023-05-13 01:00:10,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +17: [2023-05-13 01:00:10,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +21: [2023-05-13 01:00:10,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +21: [2023-05-13 01:00:10,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +21: [2023-05-13 01:00:10,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:10,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:10,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:10,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:10,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:10,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:10,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:10,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +21: [2023-05-13 01:00:10,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +21: [2023-05-13 01:00:10,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +21: [2023-05-13 01:00:10,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:10,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +21: [2023-05-13 01:00:10,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +21: [2023-05-13 01:00:10,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +21: [2023-05-13 01:00:10,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +21: [2023-05-13 01:00:10,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +13: [2023-05-13 01:00:10,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +26: [2023-05-13 01:00:10,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +17: [2023-05-13 01:00:10,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +17: [2023-05-13 01:00:10,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +17: [2023-05-13 01:00:10,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +17: [2023-05-13 01:00:10,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:10,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +21: [2023-05-13 01:00:10,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +21: [2023-05-13 01:00:10,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +21: [2023-05-13 01:00:10,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +27: [2023-05-13 01:00:10,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +26: [2023-05-13 01:00:10,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +27: [2023-05-13 01:00:10,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +31: [2023-05-13 01:00:10,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +31: [2023-05-13 01:00:10,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +21: [2023-05-13 01:00:10,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +21: [2023-05-13 01:00:10,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +21: [2023-05-13 01:00:10,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +17: [2023-05-13 01:00:10,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:10,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +31: [2023-05-13 01:00:10,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +31: [2023-05-13 01:00:10,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +31: [2023-05-13 01:00:10,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +31: [2023-05-13 01:00:10,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +31: [2023-05-13 01:00:10,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:10,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +31: [2023-05-13 01:00:10,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:10,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +21: [2023-05-13 01:00:10,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +27: [2023-05-13 01:00:10,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +27: [2023-05-13 01:00:10,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +27: [2023-05-13 01:00:10,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +27: [2023-05-13 01:00:10,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +27: [2023-05-13 01:00:10,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +27: [2023-05-13 01:00:10,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +17: [2023-05-13 01:00:10,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +17: [2023-05-13 01:00:10,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +17: [2023-05-13 01:00:10,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +17: [2023-05-13 01:00:10,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:10,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +14: [2023-05-13 01:00:10,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +14: [2023-05-13 01:00:10,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +14: [2023-05-13 01:00:10,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +13: [2023-05-13 01:00:10,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +13: [2023-05-13 01:00:10,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:10,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +14: [2023-05-13 01:00:10,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +14: [2023-05-13 01:00:10,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +14: [2023-05-13 01:00:10,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +13: [2023-05-13 01:00:10,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +13: [2023-05-13 01:00:10,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +13: [2023-05-13 01:00:10,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +13: [2023-05-13 01:00:10,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_18-model_00-model_states.pt. +21: [2023-05-13 01:00:10,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:10,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:10,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +21: [2023-05-13 01:00:10,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +14: [2023-05-13 01:00:10,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:10,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +21: [2023-05-13 01:00:10,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +14: [2023-05-13 01:00:10,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:10,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:10,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:10,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:10,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +14: [2023-05-13 01:00:10,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:10,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +21: [2023-05-13 01:00:10,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +21: [2023-05-13 01:00:10,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +29: [2023-05-13 01:00:10,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +29: [2023-05-13 01:00:10,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +29: [2023-05-13 01:00:10,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +29: [2023-05-13 01:00:10,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +29: [2023-05-13 01:00:10,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +29: [2023-05-13 01:00:10,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +29: [2023-05-13 01:00:10,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +29: [2023-05-13 01:00:10,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +29: [2023-05-13 01:00:10,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +29: [2023-05-13 01:00:10,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +29: [2023-05-13 01:00:10,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +13: [2023-05-13 01:00:10,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +29: [2023-05-13 01:00:10,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +29: [2023-05-13 01:00:10,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +29: [2023-05-13 01:00:10,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +29: [2023-05-13 01:00:10,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +13: [2023-05-13 01:00:10,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +29: [2023-05-13 01:00:10,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +21: [2023-05-13 01:00:10,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +21: [2023-05-13 01:00:10,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:10,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +16: [2023-05-13 01:00:10,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +16: [2023-05-13 01:00:10,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +16: [2023-05-13 01:00:10,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +16: [2023-05-13 01:00:10,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +16: [2023-05-13 01:00:10,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +16: [2023-05-13 01:00:10,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +16: [2023-05-13 01:00:10,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +16: [2023-05-13 01:00:10,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +13: [2023-05-13 01:00:10,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +13: [2023-05-13 01:00:10,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +26: [2023-05-13 01:00:10,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +16: [2023-05-13 01:00:10,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +21: [2023-05-13 01:00:10,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +21: [2023-05-13 01:00:10,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:10,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:10,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:10,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:10,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:10,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +14: [2023-05-13 01:00:10,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +16: [2023-05-13 01:00:10,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +16: [2023-05-13 01:00:10,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +16: [2023-05-13 01:00:10,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +16: [2023-05-13 01:00:10,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +16: [2023-05-13 01:00:10,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +16: [2023-05-13 01:00:10,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +16: [2023-05-13 01:00:10,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +21: [2023-05-13 01:00:10,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +21: [2023-05-13 01:00:10,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +21: [2023-05-13 01:00:10,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +11: [2023-05-13 01:00:10,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +11: [2023-05-13 01:00:10,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:10,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +11: [2023-05-13 01:00:10,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +11: [2023-05-13 01:00:10,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +21: [2023-05-13 01:00:10,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +11: [2023-05-13 01:00:10,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +11: [2023-05-13 01:00:10,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +11: [2023-05-13 01:00:10,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +11: [2023-05-13 01:00:10,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +11: [2023-05-13 01:00:10,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +11: [2023-05-13 01:00:10,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +21: [2023-05-13 01:00:10,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +11: [2023-05-13 01:00:10,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +11: [2023-05-13 01:00:10,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +11: [2023-05-13 01:00:10,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +11: [2023-05-13 01:00:10,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +11: [2023-05-13 01:00:10,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +11: [2023-05-13 01:00:10,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +21: [2023-05-13 01:00:10,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +26: [2023-05-13 01:00:10,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +26: [2023-05-13 01:00:10,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +26: [2023-05-13 01:00:10,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +29: [2023-05-13 01:00:10,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +29: [2023-05-13 01:00:10,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:10,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +26: [2023-05-13 01:00:10,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +29: [2023-05-13 01:00:10,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +16: [2023-05-13 01:00:10,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +29: [2023-05-13 01:00:10,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +29: [2023-05-13 01:00:10,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +11: [2023-05-13 01:00:10,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +29: [2023-05-13 01:00:10,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +29: [2023-05-13 01:00:10,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +29: [2023-05-13 01:00:10,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +29: [2023-05-13 01:00:10,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +29: [2023-05-13 01:00:10,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +16: [2023-05-13 01:00:10,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +29: [2023-05-13 01:00:10,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +11: [2023-05-13 01:00:10,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +29: [2023-05-13 01:00:10,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +11: [2023-05-13 01:00:10,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +11: [2023-05-13 01:00:10,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +16: [2023-05-13 01:00:10,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +16: [2023-05-13 01:00:10,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +16: [2023-05-13 01:00:10,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +16: [2023-05-13 01:00:10,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +16: [2023-05-13 01:00:10,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +16: [2023-05-13 01:00:10,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +16: [2023-05-13 01:00:10,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +11: [2023-05-13 01:00:10,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +11: [2023-05-13 01:00:10,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +29: [2023-05-13 01:00:10,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +29: [2023-05-13 01:00:10,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +29: [2023-05-13 01:00:10,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +29: [2023-05-13 01:00:10,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +11: [2023-05-13 01:00:10,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +11: [2023-05-13 01:00:10,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +11: [2023-05-13 01:00:10,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +11: [2023-05-13 01:00:10,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +18: [2023-05-13 01:00:10,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +18: [2023-05-13 01:00:10,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +18: [2023-05-13 01:00:10,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +18: [2023-05-13 01:00:10,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +18: [2023-05-13 01:00:10,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +18: [2023-05-13 01:00:10,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +18: [2023-05-13 01:00:10,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +18: [2023-05-13 01:00:10,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +19: [2023-05-13 01:00:10,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +18: [2023-05-13 01:00:10,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +19: [2023-05-13 01:00:10,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +19: [2023-05-13 01:00:10,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +19: [2023-05-13 01:00:10,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +19: [2023-05-13 01:00:10,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +19: [2023-05-13 01:00:10,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +19: [2023-05-13 01:00:10,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +19: [2023-05-13 01:00:10,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +11: [2023-05-13 01:00:10,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +23: [2023-05-13 01:00:10,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +23: [2023-05-13 01:00:10,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +12: [2023-05-13 01:00:10,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +12: [2023-05-13 01:00:10,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +15: [2023-05-13 01:00:10,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +15: [2023-05-13 01:00:10,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +15: [2023-05-13 01:00:10,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +15: [2023-05-13 01:00:10,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +15: [2023-05-13 01:00:10,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +15: [2023-05-13 01:00:10,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +12: [2023-05-13 01:00:10,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +12: [2023-05-13 01:00:10,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +12: [2023-05-13 01:00:10,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +15: [2023-05-13 01:00:10,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +23: [2023-05-13 01:00:10,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +12: [2023-05-13 01:00:10,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +18: [2023-05-13 01:00:10,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +18: [2023-05-13 01:00:10,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +19: [2023-05-13 01:00:10,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +18: [2023-05-13 01:00:10,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +15: [2023-05-13 01:00:10,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +23: [2023-05-13 01:00:10,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 3: [2023-05-13 01:00:10,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +12: [2023-05-13 01:00:10,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +15: [2023-05-13 01:00:10,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +23: [2023-05-13 01:00:10,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +23: [2023-05-13 01:00:10,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +23: [2023-05-13 01:00:10,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +23: [2023-05-13 01:00:10,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +23: [2023-05-13 01:00:10,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 0: [2023-05-13 01:00:10,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +18: [2023-05-13 01:00:10,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:10,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:10,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +15: [2023-05-13 01:00:10,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +23: [2023-05-13 01:00:10,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +18: [2023-05-13 01:00:10,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +19: [2023-05-13 01:00:10,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +18: [2023-05-13 01:00:10,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +18: [2023-05-13 01:00:10,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +15: [2023-05-13 01:00:10,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +15: [2023-05-13 01:00:10,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +15: [2023-05-13 01:00:10,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +15: [2023-05-13 01:00:10,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +19: [2023-05-13 01:00:10,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +19: [2023-05-13 01:00:10,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +11: [2023-05-13 01:00:10,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:10,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +19: [2023-05-13 01:00:10,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +19: [2023-05-13 01:00:10,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +15: [2023-05-13 01:00:10,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +23: [2023-05-13 01:00:10,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +23: [2023-05-13 01:00:10,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +23: [2023-05-13 01:00:10,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +19: [2023-05-13 01:00:10,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +16: [2023-05-13 01:00:10,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +23: [2023-05-13 01:00:10,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +23: [2023-05-13 01:00:10,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +11: [2023-05-13 01:00:10,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +16: [2023-05-13 01:00:10,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +16: [2023-05-13 01:00:10,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +16: [2023-05-13 01:00:10,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +19: [2023-05-13 01:00:10,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +16: [2023-05-13 01:00:10,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:10,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +11: [2023-05-13 01:00:10,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +16: [2023-05-13 01:00:10,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +16: [2023-05-13 01:00:10,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +11: [2023-05-13 01:00:10,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +11: [2023-05-13 01:00:10,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +22: [2023-05-13 01:00:10,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +22: [2023-05-13 01:00:10,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +22: [2023-05-13 01:00:10,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +22: [2023-05-13 01:00:10,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +22: [2023-05-13 01:00:10,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +22: [2023-05-13 01:00:10,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +22: [2023-05-13 01:00:10,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +22: [2023-05-13 01:00:10,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +22: [2023-05-13 01:00:10,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +20: [2023-05-13 01:00:10,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +20: [2023-05-13 01:00:10,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +22: [2023-05-13 01:00:10,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +22: [2023-05-13 01:00:10,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +22: [2023-05-13 01:00:10,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +22: [2023-05-13 01:00:10,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +22: [2023-05-13 01:00:10,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +20: [2023-05-13 01:00:10,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +20: [2023-05-13 01:00:10,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +22: [2023-05-13 01:00:10,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 6: [2023-05-13 01:00:10,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +22: [2023-05-13 01:00:10,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +20: [2023-05-13 01:00:10,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +20: [2023-05-13 01:00:10,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +20: [2023-05-13 01:00:10,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +20: [2023-05-13 01:00:10,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +20: [2023-05-13 01:00:10,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +20: [2023-05-13 01:00:10,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 6: [2023-05-13 01:00:10,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:10,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +23: [2023-05-13 01:00:10,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +30: [2023-05-13 01:00:10,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +30: [2023-05-13 01:00:10,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +20: [2023-05-13 01:00:10,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +20: [2023-05-13 01:00:10,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +30: [2023-05-13 01:00:10,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +30: [2023-05-13 01:00:10,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +30: [2023-05-13 01:00:10,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +30: [2023-05-13 01:00:10,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +30: [2023-05-13 01:00:10,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +30: [2023-05-13 01:00:10,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +20: [2023-05-13 01:00:10,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +30: [2023-05-13 01:00:10,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 5: [2023-05-13 01:00:10,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +18: [2023-05-13 01:00:10,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +20: [2023-05-13 01:00:10,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +20: [2023-05-13 01:00:10,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +15: [2023-05-13 01:00:10,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +20: [2023-05-13 01:00:10,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +30: [2023-05-13 01:00:10,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +30: [2023-05-13 01:00:10,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +30: [2023-05-13 01:00:10,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +30: [2023-05-13 01:00:10,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +19: [2023-05-13 01:00:10,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +30: [2023-05-13 01:00:10,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +30: [2023-05-13 01:00:10,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +23: [2023-05-13 01:00:10,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +18: [2023-05-13 01:00:10,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +18: [2023-05-13 01:00:10,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 5: [2023-05-13 01:00:10,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:10,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +12: [2023-05-13 01:00:10,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +12: [2023-05-13 01:00:10,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +23: [2023-05-13 01:00:10,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +18: [2023-05-13 01:00:10,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +25: [2023-05-13 01:00:10,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +25: [2023-05-13 01:00:10,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +25: [2023-05-13 01:00:10,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +22: [2023-05-13 01:00:10,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +15: [2023-05-13 01:00:10,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +25: [2023-05-13 01:00:10,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +25: [2023-05-13 01:00:10,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +25: [2023-05-13 01:00:10,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +25: [2023-05-13 01:00:10,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +25: [2023-05-13 01:00:10,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +18: [2023-05-13 01:00:10,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +25: [2023-05-13 01:00:10,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +25: [2023-05-13 01:00:10,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +18: [2023-05-13 01:00:10,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +23: [2023-05-13 01:00:10,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +19: [2023-05-13 01:00:10,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +18: [2023-05-13 01:00:10,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +18: [2023-05-13 01:00:10,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +18: [2023-05-13 01:00:10,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +30: [2023-05-13 01:00:10,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +20: [2023-05-13 01:00:10,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +23: [2023-05-13 01:00:10,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:10,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +15: [2023-05-13 01:00:10,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +18: [2023-05-13 01:00:10,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +15: [2023-05-13 01:00:10,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +19: [2023-05-13 01:00:10,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +19: [2023-05-13 01:00:10,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +19: [2023-05-13 01:00:10,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +15: [2023-05-13 01:00:10,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +18: [2023-05-13 01:00:10,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +22: [2023-05-13 01:00:10,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +15: [2023-05-13 01:00:10,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +19: [2023-05-13 01:00:10,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +22: [2023-05-13 01:00:10,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +22: [2023-05-13 01:00:10,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +22: [2023-05-13 01:00:10,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +12: [2023-05-13 01:00:10,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:10,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +12: [2023-05-13 01:00:10,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +23: [2023-05-13 01:00:10,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +23: [2023-05-13 01:00:10,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +23: [2023-05-13 01:00:10,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +12: [2023-05-13 01:00:10,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +23: [2023-05-13 01:00:10,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +18: [2023-05-13 01:00:10,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +23: [2023-05-13 01:00:10,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +30: [2023-05-13 01:00:10,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +19: [2023-05-13 01:00:10,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +19: [2023-05-13 01:00:10,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +23: [2023-05-13 01:00:10,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +30: [2023-05-13 01:00:10,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +10: [2023-05-13 01:00:10,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +19: [2023-05-13 01:00:10,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +10: [2023-05-13 01:00:10,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +10: [2023-05-13 01:00:10,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +10: [2023-05-13 01:00:10,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +10: [2023-05-13 01:00:10,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +10: [2023-05-13 01:00:10,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +20: [2023-05-13 01:00:10,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +22: [2023-05-13 01:00:10,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 9: [2023-05-13 01:00:10,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +20: [2023-05-13 01:00:10,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +10: [2023-05-13 01:00:10,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +10: [2023-05-13 01:00:10,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +12: [2023-05-13 01:00:10,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +12: [2023-05-13 01:00:10,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +12: [2023-05-13 01:00:10,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +12: [2023-05-13 01:00:10,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:10,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +10: [2023-05-13 01:00:10,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +10: [2023-05-13 01:00:10,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +10: [2023-05-13 01:00:10,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +10: [2023-05-13 01:00:10,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +18: [2023-05-13 01:00:10,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:10,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +18: [2023-05-13 01:00:10,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +18: [2023-05-13 01:00:10,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:10,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 9: [2023-05-13 01:00:10,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +30: [2023-05-13 01:00:10,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +15: [2023-05-13 01:00:10,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +22: [2023-05-13 01:00:10,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +22: [2023-05-13 01:00:10,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +22: [2023-05-13 01:00:10,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +30: [2023-05-13 01:00:10,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +22: [2023-05-13 01:00:10,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +22: [2023-05-13 01:00:10,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +15: [2023-05-13 01:00:10,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +18: [2023-05-13 01:00:10,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +19: [2023-05-13 01:00:10,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +22: [2023-05-13 01:00:10,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +12: [2023-05-13 01:00:10,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +19: [2023-05-13 01:00:10,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:10,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +19: [2023-05-13 01:00:10,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +30: [2023-05-13 01:00:10,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +24: [2023-05-13 01:00:10,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +24: [2023-05-13 01:00:10,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +24: [2023-05-13 01:00:10,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +24: [2023-05-13 01:00:10,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +24: [2023-05-13 01:00:10,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +24: [2023-05-13 01:00:10,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +25: [2023-05-13 01:00:10,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +25: [2023-05-13 01:00:10,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +24: [2023-05-13 01:00:10,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +24: [2023-05-13 01:00:10,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +20: [2023-05-13 01:00:10,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +20: [2023-05-13 01:00:10,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +20: [2023-05-13 01:00:10,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +24: [2023-05-13 01:00:10,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +24: [2023-05-13 01:00:10,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +24: [2023-05-13 01:00:10,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +24: [2023-05-13 01:00:10,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +23: [2023-05-13 01:00:10,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +23: [2023-05-13 01:00:10,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +19: [2023-05-13 01:00:10,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +20: [2023-05-13 01:00:10,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +23: [2023-05-13 01:00:10,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +19: [2023-05-13 01:00:10,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +23: [2023-05-13 01:00:10,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +24: [2023-05-13 01:00:10,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +24: [2023-05-13 01:00:10,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +24: [2023-05-13 01:00:10,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +24: [2023-05-13 01:00:10,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +19: [2023-05-13 01:00:10,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:10,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +19: [2023-05-13 01:00:10,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +22: [2023-05-13 01:00:10,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +22: [2023-05-13 01:00:10,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:10,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +23: [2023-05-13 01:00:10,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +12: [2023-05-13 01:00:10,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +12: [2023-05-13 01:00:10,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +30: [2023-05-13 01:00:10,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +30: [2023-05-13 01:00:10,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +20: [2023-05-13 01:00:10,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +20: [2023-05-13 01:00:10,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +30: [2023-05-13 01:00:10,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +20: [2023-05-13 01:00:10,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +30: [2023-05-13 01:00:10,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +22: [2023-05-13 01:00:10,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +22: [2023-05-13 01:00:10,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:10,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +25: [2023-05-13 01:00:10,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +12: [2023-05-13 01:00:10,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +25: [2023-05-13 01:00:10,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +12: [2023-05-13 01:00:10,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +25: [2023-05-13 01:00:10,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +25: [2023-05-13 01:00:10,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +25: [2023-05-13 01:00:10,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +27: [2023-05-13 01:00:10,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +27: [2023-05-13 01:00:10,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +27: [2023-05-13 01:00:10,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +27: [2023-05-13 01:00:10,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +27: [2023-05-13 01:00:10,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +27: [2023-05-13 01:00:10,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +27: [2023-05-13 01:00:10,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +27: [2023-05-13 01:00:10,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +27: [2023-05-13 01:00:10,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +27: [2023-05-13 01:00:10,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +20: [2023-05-13 01:00:10,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +27: [2023-05-13 01:00:10,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +27: [2023-05-13 01:00:10,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +24: [2023-05-13 01:00:10,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +20: [2023-05-13 01:00:10,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +20: [2023-05-13 01:00:10,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +10: [2023-05-13 01:00:10,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +10: [2023-05-13 01:00:10,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +10: [2023-05-13 01:00:10,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:10,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +30: [2023-05-13 01:00:10,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +10: [2023-05-13 01:00:10,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +10: [2023-05-13 01:00:10,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +10: [2023-05-13 01:00:10,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +10: [2023-05-13 01:00:10,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +30: [2023-05-13 01:00:10,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +30: [2023-05-13 01:00:10,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +21: [2023-05-13 01:00:10,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +20: [2023-05-13 01:00:10,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +20: [2023-05-13 01:00:10,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +25: [2023-05-13 01:00:10,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +21: [2023-05-13 01:00:10,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +25: [2023-05-13 01:00:10,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +25: [2023-05-13 01:00:10,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 1: [2023-05-13 01:00:10,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:10,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:10,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +25: [2023-05-13 01:00:10,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +20: [2023-05-13 01:00:10,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +21: [2023-05-13 01:00:10,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +21: [2023-05-13 01:00:10,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +21: [2023-05-13 01:00:10,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +21: [2023-05-13 01:00:10,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +25: [2023-05-13 01:00:10,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +21: [2023-05-13 01:00:10,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 7: [2023-05-13 01:00:10,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:10,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +25: [2023-05-13 01:00:10,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +21: [2023-05-13 01:00:10,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +10: [2023-05-13 01:00:10,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +21: [2023-05-13 01:00:10,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 7: [2023-05-13 01:00:10,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:10,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +21: [2023-05-13 01:00:10,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +24: [2023-05-13 01:00:10,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +21: [2023-05-13 01:00:10,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +21: [2023-05-13 01:00:10,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +21: [2023-05-13 01:00:10,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +24: [2023-05-13 01:00:10,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +24: [2023-05-13 01:00:10,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:10,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +10: [2023-05-13 01:00:10,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +10: [2023-05-13 01:00:10,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +10: [2023-05-13 01:00:10,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +10: [2023-05-13 01:00:10,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +10: [2023-05-13 01:00:10,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:10,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 4: [2023-05-13 01:00:10,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +24: [2023-05-13 01:00:10,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +24: [2023-05-13 01:00:10,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 8: [2023-05-13 01:00:10,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 8: [2023-05-13 01:00:10,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +24: [2023-05-13 01:00:10,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 1: [2023-05-13 01:00:10,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +10: [2023-05-13 01:00:10,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 4: [2023-05-13 01:00:10,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +27: [2023-05-13 01:00:10,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +27: [2023-05-13 01:00:10,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +27: [2023-05-13 01:00:10,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +27: [2023-05-13 01:00:10,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +21: [2023-05-13 01:00:10,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +28: [2023-05-13 01:00:10,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +28: [2023-05-13 01:00:10,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +28: [2023-05-13 01:00:10,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +28: [2023-05-13 01:00:10,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +28: [2023-05-13 01:00:10,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +28: [2023-05-13 01:00:10,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +28: [2023-05-13 01:00:10,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +28: [2023-05-13 01:00:10,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +27: [2023-05-13 01:00:10,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +27: [2023-05-13 01:00:10,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +27: [2023-05-13 01:00:10,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +27: [2023-05-13 01:00:10,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:10,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +28: [2023-05-13 01:00:10,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +28: [2023-05-13 01:00:10,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +28: [2023-05-13 01:00:10,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +28: [2023-05-13 01:00:10,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +28: [2023-05-13 01:00:10,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +28: [2023-05-13 01:00:10,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +28: [2023-05-13 01:00:10,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +28: [2023-05-13 01:00:10,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +24: [2023-05-13 01:00:10,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +24: [2023-05-13 01:00:10,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 2: [2023-05-13 01:00:10,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +24: [2023-05-13 01:00:10,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +24: [2023-05-13 01:00:10,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +21: [2023-05-13 01:00:11,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +24: [2023-05-13 01:00:11,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:11,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +21: [2023-05-13 01:00:11,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +27: [2023-05-13 01:00:11,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +27: [2023-05-13 01:00:11,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:11,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +21: [2023-05-13 01:00:11,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +27: [2023-05-13 01:00:11,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +27: [2023-05-13 01:00:11,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +27: [2023-05-13 01:00:11,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +27: [2023-05-13 01:00:11,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +27: [2023-05-13 01:00:11,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:11,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +27: [2023-05-13 01:00:11,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:11,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +21: [2023-05-13 01:00:11,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +21: [2023-05-13 01:00:11,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:11,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:11,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:11,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +28: [2023-05-13 01:00:11,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +28: [2023-05-13 01:00:11,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +28: [2023-05-13 01:00:11,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +28: [2023-05-13 01:00:11,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +28: [2023-05-13 01:00:11,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +28: [2023-05-13 01:00:11,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +28: [2023-05-13 01:00:11,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +28: [2023-05-13 01:00:11,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +21: [2023-05-13 01:00:11,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:11,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:11,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +29: [2023-05-13 01:00:11,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +29: [2023-05-13 01:00:11,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +29: [2023-05-13 01:00:11,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +29: [2023-05-13 01:00:11,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +29: [2023-05-13 01:00:11,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +29: [2023-05-13 01:00:11,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +29: [2023-05-13 01:00:11,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +29: [2023-05-13 01:00:11,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +26: [2023-05-13 01:00:11,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +26: [2023-05-13 01:00:11,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +26: [2023-05-13 01:00:11,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +26: [2023-05-13 01:00:11,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +26: [2023-05-13 01:00:11,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +26: [2023-05-13 01:00:11,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +26: [2023-05-13 01:00:11,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +26: [2023-05-13 01:00:11,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +29: [2023-05-13 01:00:11,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +26: [2023-05-13 01:00:11,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +26: [2023-05-13 01:00:11,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +29: [2023-05-13 01:00:11,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +29: [2023-05-13 01:00:11,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +29: [2023-05-13 01:00:11,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +29: [2023-05-13 01:00:11,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +29: [2023-05-13 01:00:11,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +29: [2023-05-13 01:00:11,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +26: [2023-05-13 01:00:11,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +29: [2023-05-13 01:00:11,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +26: [2023-05-13 01:00:11,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +26: [2023-05-13 01:00:11,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +28: [2023-05-13 01:00:11,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +26: [2023-05-13 01:00:11,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +28: [2023-05-13 01:00:11,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +26: [2023-05-13 01:00:11,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +26: [2023-05-13 01:00:11,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +28: [2023-05-13 01:00:11,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +28: [2023-05-13 01:00:11,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +28: [2023-05-13 01:00:11,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +28: [2023-05-13 01:00:11,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +28: [2023-05-13 01:00:11,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +28: [2023-05-13 01:00:11,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:11,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +13: [2023-05-13 01:00:11,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +13: [2023-05-13 01:00:11,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +13: [2023-05-13 01:00:11,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +13: [2023-05-13 01:00:11,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +13: [2023-05-13 01:00:11,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +13: [2023-05-13 01:00:11,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +13: [2023-05-13 01:00:11,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +13: [2023-05-13 01:00:11,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +13: [2023-05-13 01:00:11,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +13: [2023-05-13 01:00:11,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +16: [2023-05-13 01:00:11,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +16: [2023-05-13 01:00:11,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +16: [2023-05-13 01:00:11,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +16: [2023-05-13 01:00:11,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +16: [2023-05-13 01:00:11,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +16: [2023-05-13 01:00:11,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +16: [2023-05-13 01:00:11,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +16: [2023-05-13 01:00:11,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:11,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +13: [2023-05-13 01:00:11,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +13: [2023-05-13 01:00:11,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +13: [2023-05-13 01:00:11,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... +16: [2023-05-13 01:00:11,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +16: [2023-05-13 01:00:11,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +16: [2023-05-13 01:00:11,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:11,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +26: [2023-05-13 01:00:11,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +16: [2023-05-13 01:00:11,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +16: [2023-05-13 01:00:11,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +16: [2023-05-13 01:00:11,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +16: [2023-05-13 01:00:11,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +16: [2023-05-13 01:00:11,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +31: [2023-05-13 01:00:11,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +31: [2023-05-13 01:00:11,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +31: [2023-05-13 01:00:11,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +31: [2023-05-13 01:00:11,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +31: [2023-05-13 01:00:11,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +31: [2023-05-13 01:00:11,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +31: [2023-05-13 01:00:11,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +29: [2023-05-13 01:00:11,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +31: [2023-05-13 01:00:11,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +31: [2023-05-13 01:00:11,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +31: [2023-05-13 01:00:11,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +31: [2023-05-13 01:00:11,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +31: [2023-05-13 01:00:11,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +31: [2023-05-13 01:00:11,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +17: [2023-05-13 01:00:11,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +17: [2023-05-13 01:00:11,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +17: [2023-05-13 01:00:11,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +26: [2023-05-13 01:00:11,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +17: [2023-05-13 01:00:11,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +17: [2023-05-13 01:00:11,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +17: [2023-05-13 01:00:11,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +17: [2023-05-13 01:00:11,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +17: [2023-05-13 01:00:11,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +31: [2023-05-13 01:00:11,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +31: [2023-05-13 01:00:11,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +17: [2023-05-13 01:00:11,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:11,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +14: [2023-05-13 01:00:11,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +31: [2023-05-13 01:00:11,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +14: [2023-05-13 01:00:11,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +14: [2023-05-13 01:00:11,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +14: [2023-05-13 01:00:11,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +14: [2023-05-13 01:00:11,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +14: [2023-05-13 01:00:11,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +14: [2023-05-13 01:00:11,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:11,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +15: [2023-05-13 01:00:11,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +17: [2023-05-13 01:00:11,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +17: [2023-05-13 01:00:11,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:11,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +15: [2023-05-13 01:00:11,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +15: [2023-05-13 01:00:11,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +15: [2023-05-13 01:00:11,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +15: [2023-05-13 01:00:11,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +15: [2023-05-13 01:00:11,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +14: [2023-05-13 01:00:11,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:11,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:11,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:11,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:11,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:11,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:11,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +17: [2023-05-13 01:00:11,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +17: [2023-05-13 01:00:11,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +17: [2023-05-13 01:00:11,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +29: [2023-05-13 01:00:11,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +29: [2023-05-13 01:00:11,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +29: [2023-05-13 01:00:11,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +15: [2023-05-13 01:00:11,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +26: [2023-05-13 01:00:11,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +17: [2023-05-13 01:00:11,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:11,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +17: [2023-05-13 01:00:11,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:11,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:11,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:11,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:11,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:11,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:11,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:11,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +26: [2023-05-13 01:00:11,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:11,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:11,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:11,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:11,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +23: [2023-05-13 01:00:11,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:11,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:11,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:11,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:11,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +29: [2023-05-13 01:00:11,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:11,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +29: [2023-05-13 01:00:11,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +29: [2023-05-13 01:00:11,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:11,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +23: [2023-05-13 01:00:11,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +23: [2023-05-13 01:00:11,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +29: [2023-05-13 01:00:11,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:11,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +23: [2023-05-13 01:00:11,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +23: [2023-05-13 01:00:11,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +26: [2023-05-13 01:00:11,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +13: [2023-05-13 01:00:11,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +13: [2023-05-13 01:00:11,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:11,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +26: [2023-05-13 01:00:11,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +26: [2023-05-13 01:00:11,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +26: [2023-05-13 01:00:11,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +26: [2023-05-13 01:00:11,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +29: [2023-05-13 01:00:11,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +29: [2023-05-13 01:00:11,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +29: [2023-05-13 01:00:11,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +16: [2023-05-13 01:00:11,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +26: [2023-05-13 01:00:11,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +29: [2023-05-13 01:00:11,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +18: [2023-05-13 01:00:11,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +18: [2023-05-13 01:00:11,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +13: [2023-05-13 01:00:11,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +18: [2023-05-13 01:00:11,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +18: [2023-05-13 01:00:11,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +18: [2023-05-13 01:00:11,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +18: [2023-05-13 01:00:11,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +18: [2023-05-13 01:00:11,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +18: [2023-05-13 01:00:11,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +18: [2023-05-13 01:00:11,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +18: [2023-05-13 01:00:11,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +18: [2023-05-13 01:00:11,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +11: [2023-05-13 01:00:11,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +11: [2023-05-13 01:00:11,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +11: [2023-05-13 01:00:11,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +11: [2023-05-13 01:00:11,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +11: [2023-05-13 01:00:11,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +11: [2023-05-13 01:00:11,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +11: [2023-05-13 01:00:11,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +11: [2023-05-13 01:00:11,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +18: [2023-05-13 01:00:11,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:11,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +18: [2023-05-13 01:00:11,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +18: [2023-05-13 01:00:11,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +18: [2023-05-13 01:00:11,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:11,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +13: [2023-05-13 01:00:11,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +13: [2023-05-13 01:00:11,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +18: [2023-05-13 01:00:11,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +11: [2023-05-13 01:00:11,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +11: [2023-05-13 01:00:11,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +29: [2023-05-13 01:00:11,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +29: [2023-05-13 01:00:11,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +13: [2023-05-13 01:00:11,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +11: [2023-05-13 01:00:11,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +11: [2023-05-13 01:00:11,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +29: [2023-05-13 01:00:11,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +11: [2023-05-13 01:00:11,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +11: [2023-05-13 01:00:11,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +11: [2023-05-13 01:00:11,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +11: [2023-05-13 01:00:11,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:11,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +16: [2023-05-13 01:00:11,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +13: [2023-05-13 01:00:11,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +31: [2023-05-13 01:00:11,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +17: [2023-05-13 01:00:11,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +17: [2023-05-13 01:00:11,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +19: [2023-05-13 01:00:11,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +19: [2023-05-13 01:00:11,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +19: [2023-05-13 01:00:11,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +19: [2023-05-13 01:00:11,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +15: [2023-05-13 01:00:11,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +15: [2023-05-13 01:00:11,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +15: [2023-05-13 01:00:11,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +16: [2023-05-13 01:00:11,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +19: [2023-05-13 01:00:11,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +19: [2023-05-13 01:00:11,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +19: [2023-05-13 01:00:11,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +19: [2023-05-13 01:00:11,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +31: [2023-05-13 01:00:11,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +31: [2023-05-13 01:00:11,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +31: [2023-05-13 01:00:11,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +31: [2023-05-13 01:00:11,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +31: [2023-05-13 01:00:11,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +31: [2023-05-13 01:00:11,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +31: [2023-05-13 01:00:11,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +19: [2023-05-13 01:00:11,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +26: [2023-05-13 01:00:11,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +13: [2023-05-13 01:00:11,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_19-model_00-model_states.pt. +26: [2023-05-13 01:00:11,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +14: [2023-05-13 01:00:11,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +12: [2023-05-13 01:00:11,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +12: [2023-05-13 01:00:11,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +12: [2023-05-13 01:00:11,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +12: [2023-05-13 01:00:11,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +12: [2023-05-13 01:00:11,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +12: [2023-05-13 01:00:11,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +12: [2023-05-13 01:00:11,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +19: [2023-05-13 01:00:11,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +12: [2023-05-13 01:00:11,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +29: [2023-05-13 01:00:11,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +26: [2023-05-13 01:00:11,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +12: [2023-05-13 01:00:11,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +26: [2023-05-13 01:00:11,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +26: [2023-05-13 01:00:11,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +15: [2023-05-13 01:00:11,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:11,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:11,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +19: [2023-05-13 01:00:11,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +12: [2023-05-13 01:00:11,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +19: [2023-05-13 01:00:11,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +19: [2023-05-13 01:00:11,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +17: [2023-05-13 01:00:11,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +19: [2023-05-13 01:00:11,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +19: [2023-05-13 01:00:11,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:11,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +12: [2023-05-13 01:00:11,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +19: [2023-05-13 01:00:11,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +16: [2023-05-13 01:00:11,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +16: [2023-05-13 01:00:11,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +16: [2023-05-13 01:00:11,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +12: [2023-05-13 01:00:11,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:11,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +16: [2023-05-13 01:00:11,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +12: [2023-05-13 01:00:11,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +12: [2023-05-13 01:00:11,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:11,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +15: [2023-05-13 01:00:11,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +13: [2023-05-13 01:00:11,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +12: [2023-05-13 01:00:11,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +12: [2023-05-13 01:00:11,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:11,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:11,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +16: [2023-05-13 01:00:11,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +14: [2023-05-13 01:00:11,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +16: [2023-05-13 01:00:11,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +16: [2023-05-13 01:00:11,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +14: [2023-05-13 01:00:11,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +14: [2023-05-13 01:00:11,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +17: [2023-05-13 01:00:11,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +13: [2023-05-13 01:00:11,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:11,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:11,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +15: [2023-05-13 01:00:11,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +15: [2023-05-13 01:00:11,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +17: [2023-05-13 01:00:11,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +15: [2023-05-13 01:00:11,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +30: [2023-05-13 01:00:11,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +30: [2023-05-13 01:00:11,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +31: [2023-05-13 01:00:11,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +24: [2023-05-13 01:00:11,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +14: [2023-05-13 01:00:11,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:11,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +25: [2023-05-13 01:00:11,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +25: [2023-05-13 01:00:11,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +15: [2023-05-13 01:00:11,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +24: [2023-05-13 01:00:11,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +24: [2023-05-13 01:00:11,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +24: [2023-05-13 01:00:11,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +24: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +30: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +30: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +24: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +30: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +30: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +30: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +30: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +24: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +31: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +23: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +31: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:11,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +17: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +17: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +17: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +31: [2023-05-13 01:00:11,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +23: [2023-05-13 01:00:11,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +24: [2023-05-13 01:00:11,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +23: [2023-05-13 01:00:11,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +31: [2023-05-13 01:00:11,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +24: [2023-05-13 01:00:11,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +25: [2023-05-13 01:00:11,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +31: [2023-05-13 01:00:11,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +31: [2023-05-13 01:00:11,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +31: [2023-05-13 01:00:11,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +25: [2023-05-13 01:00:11,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +25: [2023-05-13 01:00:11,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +25: [2023-05-13 01:00:11,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +25: [2023-05-13 01:00:11,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +15: [2023-05-13 01:00:11,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +24: [2023-05-13 01:00:11,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +15: [2023-05-13 01:00:11,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +17: [2023-05-13 01:00:11,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +24: [2023-05-13 01:00:11,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +25: [2023-05-13 01:00:11,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +24: [2023-05-13 01:00:11,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +30: [2023-05-13 01:00:11,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +30: [2023-05-13 01:00:11,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +30: [2023-05-13 01:00:11,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +25: [2023-05-13 01:00:11,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +30: [2023-05-13 01:00:11,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +25: [2023-05-13 01:00:11,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +30: [2023-05-13 01:00:11,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +25: [2023-05-13 01:00:11,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +30: [2023-05-13 01:00:11,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +18: [2023-05-13 01:00:11,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +18: [2023-05-13 01:00:11,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +25: [2023-05-13 01:00:11,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +14: [2023-05-13 01:00:11,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +14: [2023-05-13 01:00:11,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +15: [2023-05-13 01:00:11,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +18: [2023-05-13 01:00:11,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +16: [2023-05-13 01:00:11,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +14: [2023-05-13 01:00:11,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +11: [2023-05-13 01:00:11,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +17: [2023-05-13 01:00:11,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +17: [2023-05-13 01:00:11,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +16: [2023-05-13 01:00:11,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +11: [2023-05-13 01:00:11,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +16: [2023-05-13 01:00:11,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +16: [2023-05-13 01:00:11,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +11: [2023-05-13 01:00:11,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:11,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:11,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:11,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:11,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +15: [2023-05-13 01:00:11,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +23: [2023-05-13 01:00:11,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +19: [2023-05-13 01:00:11,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +14: [2023-05-13 01:00:11,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +16: [2023-05-13 01:00:11,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +14: [2023-05-13 01:00:11,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +16: [2023-05-13 01:00:11,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +11: [2023-05-13 01:00:11,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +12: [2023-05-13 01:00:11,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +14: [2023-05-13 01:00:11,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +18: [2023-05-13 01:00:11,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +18: [2023-05-13 01:00:11,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:11,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +18: [2023-05-13 01:00:11,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +18: [2023-05-13 01:00:11,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +18: [2023-05-13 01:00:11,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +11: [2023-05-13 01:00:11,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +17: [2023-05-13 01:00:11,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +18: [2023-05-13 01:00:11,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +15: [2023-05-13 01:00:11,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +15: [2023-05-13 01:00:11,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +18: [2023-05-13 01:00:11,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +17: [2023-05-13 01:00:11,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +17: [2023-05-13 01:00:11,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +11: [2023-05-13 01:00:11,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +18: [2023-05-13 01:00:11,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +11: [2023-05-13 01:00:11,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +11: [2023-05-13 01:00:11,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +11: [2023-05-13 01:00:11,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +17: [2023-05-13 01:00:11,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +11: [2023-05-13 01:00:11,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +17: [2023-05-13 01:00:11,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +19: [2023-05-13 01:00:11,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +11: [2023-05-13 01:00:11,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +19: [2023-05-13 01:00:11,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:11,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +11: [2023-05-13 01:00:11,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +12: [2023-05-13 01:00:11,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +18: [2023-05-13 01:00:11,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +12: [2023-05-13 01:00:11,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +12: [2023-05-13 01:00:11,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +25: [2023-05-13 01:00:11,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +12: [2023-05-13 01:00:11,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +23: [2023-05-13 01:00:11,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +23: [2023-05-13 01:00:11,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +30: [2023-05-13 01:00:11,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +18: [2023-05-13 01:00:11,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +11: [2023-05-13 01:00:11,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +18: [2023-05-13 01:00:11,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +19: [2023-05-13 01:00:11,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +19: [2023-05-13 01:00:11,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +18: [2023-05-13 01:00:11,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +19: [2023-05-13 01:00:11,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +18: [2023-05-13 01:00:11,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +23: [2023-05-13 01:00:11,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +23: [2023-05-13 01:00:11,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +11: [2023-05-13 01:00:11,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +19: [2023-05-13 01:00:11,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +19: [2023-05-13 01:00:11,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +19: [2023-05-13 01:00:11,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +25: [2023-05-13 01:00:11,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +11: [2023-05-13 01:00:11,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +19: [2023-05-13 01:00:11,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +12: [2023-05-13 01:00:11,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +12: [2023-05-13 01:00:11,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +12: [2023-05-13 01:00:11,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +12: [2023-05-13 01:00:11,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +12: [2023-05-13 01:00:11,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +12: [2023-05-13 01:00:11,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +11: [2023-05-13 01:00:11,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +24: [2023-05-13 01:00:11,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +24: [2023-05-13 01:00:11,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +24: [2023-05-13 01:00:11,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +30: [2023-05-13 01:00:11,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +24: [2023-05-13 01:00:11,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +30: [2023-05-13 01:00:11,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +30: [2023-05-13 01:00:11,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +30: [2023-05-13 01:00:11,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +24: [2023-05-13 01:00:11,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +24: [2023-05-13 01:00:11,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +24: [2023-05-13 01:00:11,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +12: [2023-05-13 01:00:11,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +25: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +25: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +25: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +25: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +10: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +10: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +10: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +10: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +10: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +10: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +10: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +10: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +25: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +19: [2023-05-13 01:00:11,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +19: [2023-05-13 01:00:11,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +10: [2023-05-13 01:00:11,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +10: [2023-05-13 01:00:11,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +10: [2023-05-13 01:00:11,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +10: [2023-05-13 01:00:11,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +10: [2023-05-13 01:00:11,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +10: [2023-05-13 01:00:11,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +10: [2023-05-13 01:00:11,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +10: [2023-05-13 01:00:11,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +19: [2023-05-13 01:00:11,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +25: [2023-05-13 01:00:11,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +19: [2023-05-13 01:00:11,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +12: [2023-05-13 01:00:11,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +12: [2023-05-13 01:00:11,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +19: [2023-05-13 01:00:11,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +19: [2023-05-13 01:00:11,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +12: [2023-05-13 01:00:11,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +12: [2023-05-13 01:00:11,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +10: [2023-05-13 01:00:11,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +10: [2023-05-13 01:00:11,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +10: [2023-05-13 01:00:11,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +10: [2023-05-13 01:00:11,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +10: [2023-05-13 01:00:11,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +10: [2023-05-13 01:00:11,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +10: [2023-05-13 01:00:11,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +10: [2023-05-13 01:00:11,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +20: [2023-05-13 01:00:11,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +20: [2023-05-13 01:00:11,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +20: [2023-05-13 01:00:11,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +20: [2023-05-13 01:00:11,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +20: [2023-05-13 01:00:11,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +20: [2023-05-13 01:00:11,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +20: [2023-05-13 01:00:11,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +20: [2023-05-13 01:00:11,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +28: [2023-05-13 01:00:11,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +28: [2023-05-13 01:00:11,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +28: [2023-05-13 01:00:11,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +28: [2023-05-13 01:00:11,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +28: [2023-05-13 01:00:11,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +20: [2023-05-13 01:00:11,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +28: [2023-05-13 01:00:11,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +28: [2023-05-13 01:00:11,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +28: [2023-05-13 01:00:11,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +20: [2023-05-13 01:00:11,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +10: [2023-05-13 01:00:11,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +10: [2023-05-13 01:00:11,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +10: [2023-05-13 01:00:11,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +28: [2023-05-13 01:00:11,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +28: [2023-05-13 01:00:11,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +28: [2023-05-13 01:00:11,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +28: [2023-05-13 01:00:11,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +28: [2023-05-13 01:00:11,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +20: [2023-05-13 01:00:11,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +28: [2023-05-13 01:00:11,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +28: [2023-05-13 01:00:11,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +20: [2023-05-13 01:00:11,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +28: [2023-05-13 01:00:11,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +20: [2023-05-13 01:00:11,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +20: [2023-05-13 01:00:11,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +20: [2023-05-13 01:00:11,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +27: [2023-05-13 01:00:11,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +27: [2023-05-13 01:00:11,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +27: [2023-05-13 01:00:11,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +27: [2023-05-13 01:00:11,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +27: [2023-05-13 01:00:11,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +27: [2023-05-13 01:00:11,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +27: [2023-05-13 01:00:11,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +27: [2023-05-13 01:00:11,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +27: [2023-05-13 01:00:11,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +10: [2023-05-13 01:00:11,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +27: [2023-05-13 01:00:11,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +27: [2023-05-13 01:00:11,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +27: [2023-05-13 01:00:11,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +10: [2023-05-13 01:00:11,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +27: [2023-05-13 01:00:11,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +20: [2023-05-13 01:00:11,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +27: [2023-05-13 01:00:11,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +27: [2023-05-13 01:00:11,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +10: [2023-05-13 01:00:11,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +10: [2023-05-13 01:00:11,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +27: [2023-05-13 01:00:11,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +10: [2023-05-13 01:00:11,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +20: [2023-05-13 01:00:11,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +27: [2023-05-13 01:00:11,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +28: [2023-05-13 01:00:11,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +28: [2023-05-13 01:00:11,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +28: [2023-05-13 01:00:11,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +28: [2023-05-13 01:00:11,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +27: [2023-05-13 01:00:11,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +28: [2023-05-13 01:00:11,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +28: [2023-05-13 01:00:11,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +28: [2023-05-13 01:00:11,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +28: [2023-05-13 01:00:11,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +22: [2023-05-13 01:00:11,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +22: [2023-05-13 01:00:11,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +22: [2023-05-13 01:00:11,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +22: [2023-05-13 01:00:11,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +22: [2023-05-13 01:00:11,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +21: [2023-05-13 01:00:11,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +21: [2023-05-13 01:00:11,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +22: [2023-05-13 01:00:11,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +22: [2023-05-13 01:00:11,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +22: [2023-05-13 01:00:11,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +21: [2023-05-13 01:00:11,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +21: [2023-05-13 01:00:11,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +21: [2023-05-13 01:00:11,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +21: [2023-05-13 01:00:11,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:11,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +21: [2023-05-13 01:00:11,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +21: [2023-05-13 01:00:11,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +22: [2023-05-13 01:00:11,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +22: [2023-05-13 01:00:11,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +22: [2023-05-13 01:00:11,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +22: [2023-05-13 01:00:11,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +22: [2023-05-13 01:00:11,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +22: [2023-05-13 01:00:11,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +22: [2023-05-13 01:00:11,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +20: [2023-05-13 01:00:11,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +21: [2023-05-13 01:00:11,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +22: [2023-05-13 01:00:11,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:11,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:11,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:11,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +20: [2023-05-13 01:00:11,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:11,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:11,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +27: [2023-05-13 01:00:11,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +21: [2023-05-13 01:00:11,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +27: [2023-05-13 01:00:11,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +27: [2023-05-13 01:00:11,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +27: [2023-05-13 01:00:11,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +27: [2023-05-13 01:00:11,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +27: [2023-05-13 01:00:11,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +20: [2023-05-13 01:00:11,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +20: [2023-05-13 01:00:11,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +20: [2023-05-13 01:00:11,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +27: [2023-05-13 01:00:11,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +28: [2023-05-13 01:00:11,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +28: [2023-05-13 01:00:11,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +27: [2023-05-13 01:00:11,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +28: [2023-05-13 01:00:11,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +28: [2023-05-13 01:00:11,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +28: [2023-05-13 01:00:11,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +28: [2023-05-13 01:00:11,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +28: [2023-05-13 01:00:11,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +20: [2023-05-13 01:00:11,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +28: [2023-05-13 01:00:11,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +20: [2023-05-13 01:00:11,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +20: [2023-05-13 01:00:11,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +27: [2023-05-13 01:00:11,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +27: [2023-05-13 01:00:11,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +27: [2023-05-13 01:00:11,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +27: [2023-05-13 01:00:11,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:11,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +20: [2023-05-13 01:00:11,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +20: [2023-05-13 01:00:11,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +20: [2023-05-13 01:00:11,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +27: [2023-05-13 01:00:11,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +22: [2023-05-13 01:00:11,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +22: [2023-05-13 01:00:11,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +27: [2023-05-13 01:00:11,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +22: [2023-05-13 01:00:11,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +22: [2023-05-13 01:00:11,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +20: [2023-05-13 01:00:11,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +21: [2023-05-13 01:00:11,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +21: [2023-05-13 01:00:11,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +21: [2023-05-13 01:00:11,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +20: [2023-05-13 01:00:11,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +13: [2023-05-13 01:00:11,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +13: [2023-05-13 01:00:11,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +21: [2023-05-13 01:00:11,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +21: [2023-05-13 01:00:11,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +20: [2023-05-13 01:00:11,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:11,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +29: [2023-05-13 01:00:11,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +29: [2023-05-13 01:00:11,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +29: [2023-05-13 01:00:11,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +29: [2023-05-13 01:00:11,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +29: [2023-05-13 01:00:11,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +29: [2023-05-13 01:00:11,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +29: [2023-05-13 01:00:11,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +29: [2023-05-13 01:00:11,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +13: [2023-05-13 01:00:11,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +13: [2023-05-13 01:00:11,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +13: [2023-05-13 01:00:11,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +13: [2023-05-13 01:00:11,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +13: [2023-05-13 01:00:11,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:11,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +29: [2023-05-13 01:00:11,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +29: [2023-05-13 01:00:11,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +29: [2023-05-13 01:00:11,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +29: [2023-05-13 01:00:11,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +21: [2023-05-13 01:00:11,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +29: [2023-05-13 01:00:11,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +29: [2023-05-13 01:00:11,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +13: [2023-05-13 01:00:11,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:11,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +29: [2023-05-13 01:00:11,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +29: [2023-05-13 01:00:11,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +22: [2023-05-13 01:00:11,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +21: [2023-05-13 01:00:11,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +22: [2023-05-13 01:00:11,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +22: [2023-05-13 01:00:11,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +13: [2023-05-13 01:00:11,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt... +22: [2023-05-13 01:00:11,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +22: [2023-05-13 01:00:11,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +22: [2023-05-13 01:00:11,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +22: [2023-05-13 01:00:11,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +20: [2023-05-13 01:00:11,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +22: [2023-05-13 01:00:11,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +21: [2023-05-13 01:00:11,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +21: [2023-05-13 01:00:11,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +21: [2023-05-13 01:00:11,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +21: [2023-05-13 01:00:11,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +21: [2023-05-13 01:00:11,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +21: [2023-05-13 01:00:11,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +21: [2023-05-13 01:00:11,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +22: [2023-05-13 01:00:11,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +22: [2023-05-13 01:00:11,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +22: [2023-05-13 01:00:11,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +22: [2023-05-13 01:00:11,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +13: [2023-05-13 01:00:11,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +13: [2023-05-13 01:00:11,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +29: [2023-05-13 01:00:11,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +29: [2023-05-13 01:00:11,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +13: [2023-05-13 01:00:11,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +29: [2023-05-13 01:00:11,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +29: [2023-05-13 01:00:11,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +17: [2023-05-13 01:00:11,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +17: [2023-05-13 01:00:11,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +17: [2023-05-13 01:00:11,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +17: [2023-05-13 01:00:11,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +17: [2023-05-13 01:00:11,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +17: [2023-05-13 01:00:11,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +17: [2023-05-13 01:00:11,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +17: [2023-05-13 01:00:11,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +17: [2023-05-13 01:00:11,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +13: [2023-05-13 01:00:11,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +13: [2023-05-13 01:00:11,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +17: [2023-05-13 01:00:11,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +13: [2023-05-13 01:00:11,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +17: [2023-05-13 01:00:11,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +17: [2023-05-13 01:00:11,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +17: [2023-05-13 01:00:11,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +17: [2023-05-13 01:00:11,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +29: [2023-05-13 01:00:11,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +29: [2023-05-13 01:00:11,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +17: [2023-05-13 01:00:11,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +29: [2023-05-13 01:00:11,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +29: [2023-05-13 01:00:11,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +29: [2023-05-13 01:00:11,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +17: [2023-05-13 01:00:11,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +15: [2023-05-13 01:00:11,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +15: [2023-05-13 01:00:11,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +15: [2023-05-13 01:00:11,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +15: [2023-05-13 01:00:11,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +15: [2023-05-13 01:00:11,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +15: [2023-05-13 01:00:11,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +15: [2023-05-13 01:00:11,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +15: [2023-05-13 01:00:11,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +15: [2023-05-13 01:00:11,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +29: [2023-05-13 01:00:11,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +15: [2023-05-13 01:00:11,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +31: [2023-05-13 01:00:11,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +31: [2023-05-13 01:00:11,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +15: [2023-05-13 01:00:11,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +13: [2023-05-13 01:00:11,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +31: [2023-05-13 01:00:11,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +31: [2023-05-13 01:00:11,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +31: [2023-05-13 01:00:11,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +31: [2023-05-13 01:00:11,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +31: [2023-05-13 01:00:11,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +31: [2023-05-13 01:00:11,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +15: [2023-05-13 01:00:11,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +15: [2023-05-13 01:00:11,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +31: [2023-05-13 01:00:11,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +31: [2023-05-13 01:00:11,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +15: [2023-05-13 01:00:11,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +15: [2023-05-13 01:00:11,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +15: [2023-05-13 01:00:11,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +14: [2023-05-13 01:00:11,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +14: [2023-05-13 01:00:11,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +14: [2023-05-13 01:00:11,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +14: [2023-05-13 01:00:11,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +14: [2023-05-13 01:00:11,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +14: [2023-05-13 01:00:11,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +14: [2023-05-13 01:00:11,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +14: [2023-05-13 01:00:11,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +13: [2023-05-13 01:00:11,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +31: [2023-05-13 01:00:11,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +29: [2023-05-13 01:00:11,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +31: [2023-05-13 01:00:11,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +14: [2023-05-13 01:00:11,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +14: [2023-05-13 01:00:11,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +14: [2023-05-13 01:00:11,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +14: [2023-05-13 01:00:11,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +31: [2023-05-13 01:00:11,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +31: [2023-05-13 01:00:11,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +14: [2023-05-13 01:00:11,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +29: [2023-05-13 01:00:11,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +14: [2023-05-13 01:00:11,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +14: [2023-05-13 01:00:11,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +31: [2023-05-13 01:00:11,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +14: [2023-05-13 01:00:11,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +31: [2023-05-13 01:00:11,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +13: [2023-05-13 01:00:11,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_20-model_00-model_states.pt. +17: [2023-05-13 01:00:11,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +13: [2023-05-13 01:00:11,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +29: [2023-05-13 01:00:11,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +29: [2023-05-13 01:00:11,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +29: [2023-05-13 01:00:11,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +29: [2023-05-13 01:00:11,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +17: [2023-05-13 01:00:11,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +15: [2023-05-13 01:00:11,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +12: [2023-05-13 01:00:11,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +17: [2023-05-13 01:00:11,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +12: [2023-05-13 01:00:11,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +12: [2023-05-13 01:00:11,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +12: [2023-05-13 01:00:11,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +12: [2023-05-13 01:00:11,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +12: [2023-05-13 01:00:11,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +12: [2023-05-13 01:00:11,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +12: [2023-05-13 01:00:11,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +12: [2023-05-13 01:00:11,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +12: [2023-05-13 01:00:11,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +12: [2023-05-13 01:00:11,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +11: [2023-05-13 01:00:11,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +11: [2023-05-13 01:00:11,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +11: [2023-05-13 01:00:11,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +11: [2023-05-13 01:00:11,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +11: [2023-05-13 01:00:11,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +11: [2023-05-13 01:00:11,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +11: [2023-05-13 01:00:11,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +11: [2023-05-13 01:00:11,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +12: [2023-05-13 01:00:11,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +12: [2023-05-13 01:00:11,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +11: [2023-05-13 01:00:11,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +12: [2023-05-13 01:00:11,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +11: [2023-05-13 01:00:11,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +12: [2023-05-13 01:00:11,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +11: [2023-05-13 01:00:11,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +25: [2023-05-13 01:00:11,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +25: [2023-05-13 01:00:11,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +11: [2023-05-13 01:00:11,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +25: [2023-05-13 01:00:11,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +25: [2023-05-13 01:00:11,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +25: [2023-05-13 01:00:11,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +25: [2023-05-13 01:00:11,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +11: [2023-05-13 01:00:11,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +11: [2023-05-13 01:00:11,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +17: [2023-05-13 01:00:11,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +17: [2023-05-13 01:00:11,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +17: [2023-05-13 01:00:11,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +11: [2023-05-13 01:00:11,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +15: [2023-05-13 01:00:11,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +11: [2023-05-13 01:00:11,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +25: [2023-05-13 01:00:11,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +31: [2023-05-13 01:00:11,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +31: [2023-05-13 01:00:11,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +14: [2023-05-13 01:00:11,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +14: [2023-05-13 01:00:11,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +15: [2023-05-13 01:00:11,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +14: [2023-05-13 01:00:11,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +25: [2023-05-13 01:00:11,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +17: [2023-05-13 01:00:11,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +12: [2023-05-13 01:00:11,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +15: [2023-05-13 01:00:11,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +31: [2023-05-13 01:00:11,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +31: [2023-05-13 01:00:11,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +31: [2023-05-13 01:00:11,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +31: [2023-05-13 01:00:11,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +31: [2023-05-13 01:00:11,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +31: [2023-05-13 01:00:11,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +14: [2023-05-13 01:00:11,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +14: [2023-05-13 01:00:11,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +14: [2023-05-13 01:00:11,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +15: [2023-05-13 01:00:11,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +15: [2023-05-13 01:00:11,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +15: [2023-05-13 01:00:11,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +15: [2023-05-13 01:00:11,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +15: [2023-05-13 01:00:11,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +14: [2023-05-13 01:00:11,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +17: [2023-05-13 01:00:11,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +23: [2023-05-13 01:00:11,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +23: [2023-05-13 01:00:11,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +23: [2023-05-13 01:00:11,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +24: [2023-05-13 01:00:11,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +23: [2023-05-13 01:00:11,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +23: [2023-05-13 01:00:11,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +23: [2023-05-13 01:00:11,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +23: [2023-05-13 01:00:11,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +14: [2023-05-13 01:00:11,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +23: [2023-05-13 01:00:11,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +17: [2023-05-13 01:00:11,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +17: [2023-05-13 01:00:11,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +15: [2023-05-13 01:00:11,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +15: [2023-05-13 01:00:11,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +24: [2023-05-13 01:00:11,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +24: [2023-05-13 01:00:11,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +24: [2023-05-13 01:00:11,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +23: [2023-05-13 01:00:11,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +24: [2023-05-13 01:00:11,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +17: [2023-05-13 01:00:11,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +17: [2023-05-13 01:00:11,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +31: [2023-05-13 01:00:11,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +31: [2023-05-13 01:00:11,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +24: [2023-05-13 01:00:11,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +24: [2023-05-13 01:00:11,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +14: [2023-05-13 01:00:11,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +24: [2023-05-13 01:00:11,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +23: [2023-05-13 01:00:11,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +14: [2023-05-13 01:00:11,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +23: [2023-05-13 01:00:11,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +23: [2023-05-13 01:00:11,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +23: [2023-05-13 01:00:11,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +23: [2023-05-13 01:00:11,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +23: [2023-05-13 01:00:11,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +31: [2023-05-13 01:00:11,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +23: [2023-05-13 01:00:11,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +19: [2023-05-13 01:00:11,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +12: [2023-05-13 01:00:11,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +14: [2023-05-13 01:00:11,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +24: [2023-05-13 01:00:11,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +19: [2023-05-13 01:00:11,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +31: [2023-05-13 01:00:11,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +24: [2023-05-13 01:00:11,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +31: [2023-05-13 01:00:11,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +19: [2023-05-13 01:00:11,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +31: [2023-05-13 01:00:11,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +31: [2023-05-13 01:00:11,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +19: [2023-05-13 01:00:11,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +19: [2023-05-13 01:00:11,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +19: [2023-05-13 01:00:11,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +19: [2023-05-13 01:00:11,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +11: [2023-05-13 01:00:11,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +19: [2023-05-13 01:00:11,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +19: [2023-05-13 01:00:11,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +14: [2023-05-13 01:00:11,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +17: [2023-05-13 01:00:11,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +19: [2023-05-13 01:00:11,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +31: [2023-05-13 01:00:11,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +14: [2023-05-13 01:00:11,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +15: [2023-05-13 01:00:11,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +14: [2023-05-13 01:00:11,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +19: [2023-05-13 01:00:11,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +14: [2023-05-13 01:00:11,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +15: [2023-05-13 01:00:11,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +15: [2023-05-13 01:00:11,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +12: [2023-05-13 01:00:11,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +12: [2023-05-13 01:00:11,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +19: [2023-05-13 01:00:11,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +19: [2023-05-13 01:00:11,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +19: [2023-05-13 01:00:11,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +15: [2023-05-13 01:00:11,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +25: [2023-05-13 01:00:11,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +25: [2023-05-13 01:00:11,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +19: [2023-05-13 01:00:11,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +19: [2023-05-13 01:00:11,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +11: [2023-05-13 01:00:11,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +17: [2023-05-13 01:00:11,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +17: [2023-05-13 01:00:11,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +15: [2023-05-13 01:00:11,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +11: [2023-05-13 01:00:11,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +30: [2023-05-13 01:00:11,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +30: [2023-05-13 01:00:11,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +30: [2023-05-13 01:00:11,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +14: [2023-05-13 01:00:11,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +30: [2023-05-13 01:00:11,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +30: [2023-05-13 01:00:11,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +30: [2023-05-13 01:00:11,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +30: [2023-05-13 01:00:11,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +30: [2023-05-13 01:00:11,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +12: [2023-05-13 01:00:11,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +11: [2023-05-13 01:00:11,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +11: [2023-05-13 01:00:11,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +11: [2023-05-13 01:00:11,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +11: [2023-05-13 01:00:11,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +17: [2023-05-13 01:00:11,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +11: [2023-05-13 01:00:11,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +11: [2023-05-13 01:00:11,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +30: [2023-05-13 01:00:11,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +25: [2023-05-13 01:00:11,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +24: [2023-05-13 01:00:11,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +30: [2023-05-13 01:00:11,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +23: [2023-05-13 01:00:11,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +25: [2023-05-13 01:00:11,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +25: [2023-05-13 01:00:11,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +25: [2023-05-13 01:00:11,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +12: [2023-05-13 01:00:11,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +12: [2023-05-13 01:00:11,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +12: [2023-05-13 01:00:11,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +11: [2023-05-13 01:00:11,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +11: [2023-05-13 01:00:11,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +24: [2023-05-13 01:00:11,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +19: [2023-05-13 01:00:11,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +12: [2023-05-13 01:00:11,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +12: [2023-05-13 01:00:11,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +12: [2023-05-13 01:00:11,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +24: [2023-05-13 01:00:11,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +23: [2023-05-13 01:00:11,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +25: [2023-05-13 01:00:11,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +25: [2023-05-13 01:00:11,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +25: [2023-05-13 01:00:11,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +11: [2023-05-13 01:00:11,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +25: [2023-05-13 01:00:11,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +25: [2023-05-13 01:00:11,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +11: [2023-05-13 01:00:11,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +24: [2023-05-13 01:00:11,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +11: [2023-05-13 01:00:11,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +24: [2023-05-13 01:00:11,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +23: [2023-05-13 01:00:11,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +23: [2023-05-13 01:00:11,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +11: [2023-05-13 01:00:11,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +11: [2023-05-13 01:00:11,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +12: [2023-05-13 01:00:11,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +25: [2023-05-13 01:00:11,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +19: [2023-05-13 01:00:11,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +16: [2023-05-13 01:00:11,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +16: [2023-05-13 01:00:11,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +16: [2023-05-13 01:00:11,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +16: [2023-05-13 01:00:11,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +16: [2023-05-13 01:00:11,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +16: [2023-05-13 01:00:11,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +16: [2023-05-13 01:00:11,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +16: [2023-05-13 01:00:11,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +12: [2023-05-13 01:00:11,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +30: [2023-05-13 01:00:11,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +18: [2023-05-13 01:00:11,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +18: [2023-05-13 01:00:11,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +16: [2023-05-13 01:00:11,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +24: [2023-05-13 01:00:11,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +16: [2023-05-13 01:00:11,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +19: [2023-05-13 01:00:11,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +16: [2023-05-13 01:00:11,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +18: [2023-05-13 01:00:11,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +24: [2023-05-13 01:00:11,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +24: [2023-05-13 01:00:11,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +18: [2023-05-13 01:00:11,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +18: [2023-05-13 01:00:11,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +18: [2023-05-13 01:00:11,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +18: [2023-05-13 01:00:11,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +26: [2023-05-13 01:00:11,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +26: [2023-05-13 01:00:11,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +26: [2023-05-13 01:00:11,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +26: [2023-05-13 01:00:11,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +26: [2023-05-13 01:00:11,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +18: [2023-05-13 01:00:11,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +26: [2023-05-13 01:00:11,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +26: [2023-05-13 01:00:11,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +26: [2023-05-13 01:00:11,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +12: [2023-05-13 01:00:11,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +18: [2023-05-13 01:00:11,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +18: [2023-05-13 01:00:11,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +16: [2023-05-13 01:00:11,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +16: [2023-05-13 01:00:11,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +16: [2023-05-13 01:00:11,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +18: [2023-05-13 01:00:11,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +26: [2023-05-13 01:00:11,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +26: [2023-05-13 01:00:11,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +16: [2023-05-13 01:00:11,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +16: [2023-05-13 01:00:11,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +12: [2023-05-13 01:00:11,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +12: [2023-05-13 01:00:11,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +18: [2023-05-13 01:00:11,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +18: [2023-05-13 01:00:11,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +18: [2023-05-13 01:00:11,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +18: [2023-05-13 01:00:11,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +23: [2023-05-13 01:00:11,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +23: [2023-05-13 01:00:11,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +23: [2023-05-13 01:00:11,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +23: [2023-05-13 01:00:11,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +23: [2023-05-13 01:00:11,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +26: [2023-05-13 01:00:11,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +26: [2023-05-13 01:00:11,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +26: [2023-05-13 01:00:11,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +18: [2023-05-13 01:00:11,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +26: [2023-05-13 01:00:11,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +26: [2023-05-13 01:00:11,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +26: [2023-05-13 01:00:11,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +23: [2023-05-13 01:00:11,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +23: [2023-05-13 01:00:11,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +30: [2023-05-13 01:00:11,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +25: [2023-05-13 01:00:11,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +19: [2023-05-13 01:00:11,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +19: [2023-05-13 01:00:11,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +19: [2023-05-13 01:00:11,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +24: [2023-05-13 01:00:11,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +12: [2023-05-13 01:00:11,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +30: [2023-05-13 01:00:11,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +19: [2023-05-13 01:00:11,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +19: [2023-05-13 01:00:11,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +19: [2023-05-13 01:00:11,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +19: [2023-05-13 01:00:11,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +24: [2023-05-13 01:00:11,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +24: [2023-05-13 01:00:11,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +30: [2023-05-13 01:00:11,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +30: [2023-05-13 01:00:11,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +30: [2023-05-13 01:00:11,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +30: [2023-05-13 01:00:11,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +23: [2023-05-13 01:00:11,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +23: [2023-05-13 01:00:11,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +23: [2023-05-13 01:00:11,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +23: [2023-05-13 01:00:11,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +30: [2023-05-13 01:00:11,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +23: [2023-05-13 01:00:11,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +16: [2023-05-13 01:00:11,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +24: [2023-05-13 01:00:11,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +24: [2023-05-13 01:00:11,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +26: [2023-05-13 01:00:11,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +26: [2023-05-13 01:00:11,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +18: [2023-05-13 01:00:11,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +18: [2023-05-13 01:00:11,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +18: [2023-05-13 01:00:11,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +30: [2023-05-13 01:00:11,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 3: [2023-05-13 01:00:11,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 3: [2023-05-13 01:00:11,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +16: [2023-05-13 01:00:11,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +16: [2023-05-13 01:00:11,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +30: [2023-05-13 01:00:11,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +30: [2023-05-13 01:00:11,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +30: [2023-05-13 01:00:11,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 7: [2023-05-13 01:00:11,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +13: [2023-05-13 01:00:11,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +30: [2023-05-13 01:00:11,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +13: [2023-05-13 01:00:11,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +18: [2023-05-13 01:00:11,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +18: [2023-05-13 01:00:11,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +18: [2023-05-13 01:00:11,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +26: [2023-05-13 01:00:11,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +18: [2023-05-13 01:00:11,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +18: [2023-05-13 01:00:11,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +16: [2023-05-13 01:00:11,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +26: [2023-05-13 01:00:11,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +13: [2023-05-13 01:00:11,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +13: [2023-05-13 01:00:11,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 7: [2023-05-13 01:00:11,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +19: [2023-05-13 01:00:11,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +19: [2023-05-13 01:00:11,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +19: [2023-05-13 01:00:11,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +19: [2023-05-13 01:00:11,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +19: [2023-05-13 01:00:11,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +19: [2023-05-13 01:00:11,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +16: [2023-05-13 01:00:11,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +26: [2023-05-13 01:00:11,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +28: [2023-05-13 01:00:11,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +28: [2023-05-13 01:00:11,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +28: [2023-05-13 01:00:11,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +28: [2023-05-13 01:00:11,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +28: [2023-05-13 01:00:11,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +28: [2023-05-13 01:00:11,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +28: [2023-05-13 01:00:11,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +18: [2023-05-13 01:00:11,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +18: [2023-05-13 01:00:11,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +28: [2023-05-13 01:00:11,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +26: [2023-05-13 01:00:11,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +26: [2023-05-13 01:00:11,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +26: [2023-05-13 01:00:11,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +26: [2023-05-13 01:00:11,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +26: [2023-05-13 01:00:11,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 9: [2023-05-13 01:00:11,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +28: [2023-05-13 01:00:11,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +28: [2023-05-13 01:00:11,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +28: [2023-05-13 01:00:11,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +28: [2023-05-13 01:00:11,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +28: [2023-05-13 01:00:11,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +28: [2023-05-13 01:00:11,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +18: [2023-05-13 01:00:11,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +16: [2023-05-13 01:00:11,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +28: [2023-05-13 01:00:11,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +16: [2023-05-13 01:00:11,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +16: [2023-05-13 01:00:11,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 8: [2023-05-13 01:00:11,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +16: [2023-05-13 01:00:11,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +16: [2023-05-13 01:00:11,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +28: [2023-05-13 01:00:11,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +26: [2023-05-13 01:00:11,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +18: [2023-05-13 01:00:11,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 5: [2023-05-13 01:00:11,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +16: [2023-05-13 01:00:11,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +18: [2023-05-13 01:00:11,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +18: [2023-05-13 01:00:11,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +18: [2023-05-13 01:00:11,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +18: [2023-05-13 01:00:11,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +16: [2023-05-13 01:00:11,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 9: [2023-05-13 01:00:11,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +26: [2023-05-13 01:00:11,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +26: [2023-05-13 01:00:11,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +26: [2023-05-13 01:00:11,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +26: [2023-05-13 01:00:11,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +26: [2023-05-13 01:00:11,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +16: [2023-05-13 01:00:11,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +16: [2023-05-13 01:00:11,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +16: [2023-05-13 01:00:11,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 5: [2023-05-13 01:00:11,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:11,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +16: [2023-05-13 01:00:11,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +13: [2023-05-13 01:00:11,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +13: [2023-05-13 01:00:11,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 1: [2023-05-13 01:00:11,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:11,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +28: [2023-05-13 01:00:11,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +28: [2023-05-13 01:00:11,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +28: [2023-05-13 01:00:11,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +28: [2023-05-13 01:00:11,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +13: [2023-05-13 01:00:11,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +13: [2023-05-13 01:00:11,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +27: [2023-05-13 01:00:11,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:11,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:11,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:11,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:11,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:11,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:11,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +13: [2023-05-13 01:00:11,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +27: [2023-05-13 01:00:11,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:11,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +13: [2023-05-13 01:00:11,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +28: [2023-05-13 01:00:11,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +27: [2023-05-13 01:00:11,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +27: [2023-05-13 01:00:11,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +27: [2023-05-13 01:00:11,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +27: [2023-05-13 01:00:11,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +27: [2023-05-13 01:00:11,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +27: [2023-05-13 01:00:11,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +27: [2023-05-13 01:00:11,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +28: [2023-05-13 01:00:11,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +28: [2023-05-13 01:00:11,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +28: [2023-05-13 01:00:11,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +28: [2023-05-13 01:00:11,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +13: [2023-05-13 01:00:11,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +28: [2023-05-13 01:00:11,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +20: [2023-05-13 01:00:11,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +20: [2023-05-13 01:00:11,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +20: [2023-05-13 01:00:11,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +13: [2023-05-13 01:00:11,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +20: [2023-05-13 01:00:11,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +20: [2023-05-13 01:00:11,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +20: [2023-05-13 01:00:11,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +20: [2023-05-13 01:00:11,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +20: [2023-05-13 01:00:11,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +20: [2023-05-13 01:00:11,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +20: [2023-05-13 01:00:11,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +28: [2023-05-13 01:00:11,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +20: [2023-05-13 01:00:11,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +28: [2023-05-13 01:00:11,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +20: [2023-05-13 01:00:11,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... +20: [2023-05-13 01:00:11,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +20: [2023-05-13 01:00:11,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +20: [2023-05-13 01:00:11,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +20: [2023-05-13 01:00:11,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +13: [2023-05-13 01:00:11,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +13: [2023-05-13 01:00:11,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +28: [2023-05-13 01:00:11,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +13: [2023-05-13 01:00:11,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +13: [2023-05-13 01:00:11,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +28: [2023-05-13 01:00:11,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +28: [2023-05-13 01:00:11,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +28: [2023-05-13 01:00:11,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +27: [2023-05-13 01:00:11,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +20: [2023-05-13 01:00:11,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +27: [2023-05-13 01:00:11,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:11,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:11,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:11,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:11,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:11,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:11,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +20: [2023-05-13 01:00:11,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:11,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +27: [2023-05-13 01:00:11,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:11,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:11,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:11,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:11,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:11,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:11,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:11,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:11,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 4: [2023-05-13 01:00:11,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:11,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +21: [2023-05-13 01:00:11,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +21: [2023-05-13 01:00:11,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:11,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:11,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:11,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:11,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:11,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:11,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:11,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:11,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 4: [2023-05-13 01:00:11,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:11,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +21: [2023-05-13 01:00:11,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:11,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +10: [2023-05-13 01:00:11,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +10: [2023-05-13 01:00:11,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +10: [2023-05-13 01:00:11,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +10: [2023-05-13 01:00:11,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +10: [2023-05-13 01:00:11,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +10: [2023-05-13 01:00:11,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +21: [2023-05-13 01:00:11,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +21: [2023-05-13 01:00:11,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +21: [2023-05-13 01:00:11,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +21: [2023-05-13 01:00:11,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +21: [2023-05-13 01:00:11,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +21: [2023-05-13 01:00:11,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +21: [2023-05-13 01:00:11,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +20: [2023-05-13 01:00:11,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +21: [2023-05-13 01:00:11,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +21: [2023-05-13 01:00:11,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +21: [2023-05-13 01:00:11,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +20: [2023-05-13 01:00:11,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +21: [2023-05-13 01:00:11,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +20: [2023-05-13 01:00:11,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +20: [2023-05-13 01:00:11,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +21: [2023-05-13 01:00:11,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +21: [2023-05-13 01:00:11,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 6: [2023-05-13 01:00:11,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:11,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_21-model_00-model_states.pt. +20: [2023-05-13 01:00:11,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +22: [2023-05-13 01:00:11,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +22: [2023-05-13 01:00:11,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 6: [2023-05-13 01:00:11,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:11,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +22: [2023-05-13 01:00:11,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +22: [2023-05-13 01:00:11,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +22: [2023-05-13 01:00:11,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +22: [2023-05-13 01:00:11,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +22: [2023-05-13 01:00:11,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +22: [2023-05-13 01:00:11,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +22: [2023-05-13 01:00:11,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +22: [2023-05-13 01:00:11,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +22: [2023-05-13 01:00:11,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +22: [2023-05-13 01:00:11,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +22: [2023-05-13 01:00:11,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +22: [2023-05-13 01:00:11,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +22: [2023-05-13 01:00:11,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +21: [2023-05-13 01:00:11,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +20: [2023-05-13 01:00:11,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +20: [2023-05-13 01:00:11,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +20: [2023-05-13 01:00:11,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +20: [2023-05-13 01:00:11,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +20: [2023-05-13 01:00:11,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +21: [2023-05-13 01:00:11,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:11,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +21: [2023-05-13 01:00:11,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:11,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:11,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:11,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:11,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:11,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:11,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +21: [2023-05-13 01:00:11,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +21: [2023-05-13 01:00:11,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:11,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +22: [2023-05-13 01:00:11,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +22: [2023-05-13 01:00:11,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +22: [2023-05-13 01:00:11,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +22: [2023-05-13 01:00:11,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +21: [2023-05-13 01:00:11,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +21: [2023-05-13 01:00:11,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +21: [2023-05-13 01:00:11,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +21: [2023-05-13 01:00:11,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:11,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:11,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +21: [2023-05-13 01:00:11,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +22: [2023-05-13 01:00:11,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:11,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:11,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:11,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:11,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:11,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:11,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +21: [2023-05-13 01:00:11,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:11,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:11,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:11,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:11,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +21: [2023-05-13 01:00:11,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:11,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +22: [2023-05-13 01:00:11,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +21: [2023-05-13 01:00:11,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +21: [2023-05-13 01:00:11,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +21: [2023-05-13 01:00:11,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:11,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +22: [2023-05-13 01:00:11,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +21: [2023-05-13 01:00:11,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:11,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:11,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:11,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +31: [2023-05-13 01:00:11,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +31: [2023-05-13 01:00:11,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +15: [2023-05-13 01:00:11,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +15: [2023-05-13 01:00:11,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +17: [2023-05-13 01:00:11,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +17: [2023-05-13 01:00:11,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +17: [2023-05-13 01:00:11,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +15: [2023-05-13 01:00:11,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +15: [2023-05-13 01:00:11,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +31: [2023-05-13 01:00:11,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +31: [2023-05-13 01:00:11,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +17: [2023-05-13 01:00:11,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +17: [2023-05-13 01:00:11,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +17: [2023-05-13 01:00:11,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +17: [2023-05-13 01:00:11,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +31: [2023-05-13 01:00:11,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +31: [2023-05-13 01:00:11,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +31: [2023-05-13 01:00:11,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +17: [2023-05-13 01:00:11,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +31: [2023-05-13 01:00:11,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +15: [2023-05-13 01:00:11,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +14: [2023-05-13 01:00:11,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +14: [2023-05-13 01:00:11,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +15: [2023-05-13 01:00:11,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +15: [2023-05-13 01:00:11,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +15: [2023-05-13 01:00:11,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +15: [2023-05-13 01:00:11,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +15: [2023-05-13 01:00:11,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +31: [2023-05-13 01:00:11,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +31: [2023-05-13 01:00:11,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +15: [2023-05-13 01:00:11,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +17: [2023-05-13 01:00:11,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +17: [2023-05-13 01:00:11,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +14: [2023-05-13 01:00:11,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +14: [2023-05-13 01:00:11,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +17: [2023-05-13 01:00:11,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +14: [2023-05-13 01:00:11,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +14: [2023-05-13 01:00:11,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +14: [2023-05-13 01:00:11,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +14: [2023-05-13 01:00:11,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +17: [2023-05-13 01:00:11,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +14: [2023-05-13 01:00:11,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +31: [2023-05-13 01:00:11,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +15: [2023-05-13 01:00:11,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +31: [2023-05-13 01:00:11,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +14: [2023-05-13 01:00:11,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +14: [2023-05-13 01:00:11,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +31: [2023-05-13 01:00:11,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +31: [2023-05-13 01:00:11,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +14: [2023-05-13 01:00:11,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +15: [2023-05-13 01:00:11,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +31: [2023-05-13 01:00:11,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +31: [2023-05-13 01:00:11,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +17: [2023-05-13 01:00:11,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +17: [2023-05-13 01:00:11,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +15: [2023-05-13 01:00:11,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +14: [2023-05-13 01:00:11,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +17: [2023-05-13 01:00:11,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +15: [2023-05-13 01:00:11,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +17: [2023-05-13 01:00:11,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +15: [2023-05-13 01:00:11,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +14: [2023-05-13 01:00:11,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +14: [2023-05-13 01:00:11,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +14: [2023-05-13 01:00:11,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 0: [2023-05-13 01:00:11,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 0: [2023-05-13 01:00:11,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +11: [2023-05-13 01:00:11,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +11: [2023-05-13 01:00:11,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +11: [2023-05-13 01:00:11,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +11: [2023-05-13 01:00:11,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +11: [2023-05-13 01:00:11,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +11: [2023-05-13 01:00:11,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +11: [2023-05-13 01:00:11,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +11: [2023-05-13 01:00:11,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +15: [2023-05-13 01:00:11,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +15: [2023-05-13 01:00:11,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +15: [2023-05-13 01:00:11,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +11: [2023-05-13 01:00:11,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +29: [2023-05-13 01:00:11,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +29: [2023-05-13 01:00:11,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +29: [2023-05-13 01:00:11,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +29: [2023-05-13 01:00:11,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +29: [2023-05-13 01:00:11,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +29: [2023-05-13 01:00:11,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +29: [2023-05-13 01:00:11,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +11: [2023-05-13 01:00:11,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +29: [2023-05-13 01:00:11,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +11: [2023-05-13 01:00:11,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +11: [2023-05-13 01:00:11,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +11: [2023-05-13 01:00:11,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +11: [2023-05-13 01:00:11,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +14: [2023-05-13 01:00:11,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +17: [2023-05-13 01:00:11,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +17: [2023-05-13 01:00:11,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +11: [2023-05-13 01:00:11,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +11: [2023-05-13 01:00:11,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +29: [2023-05-13 01:00:11,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +12: [2023-05-13 01:00:11,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +12: [2023-05-13 01:00:11,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +12: [2023-05-13 01:00:11,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +12: [2023-05-13 01:00:11,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +12: [2023-05-13 01:00:11,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +12: [2023-05-13 01:00:11,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +12: [2023-05-13 01:00:11,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +12: [2023-05-13 01:00:11,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 2: [2023-05-13 01:00:11,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +29: [2023-05-13 01:00:11,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +25: [2023-05-13 01:00:11,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +25: [2023-05-13 01:00:11,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +25: [2023-05-13 01:00:11,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +25: [2023-05-13 01:00:11,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +25: [2023-05-13 01:00:11,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +25: [2023-05-13 01:00:11,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +25: [2023-05-13 01:00:11,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +25: [2023-05-13 01:00:11,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +29: [2023-05-13 01:00:11,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +29: [2023-05-13 01:00:11,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +12: [2023-05-13 01:00:11,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +29: [2023-05-13 01:00:11,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +29: [2023-05-13 01:00:11,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +29: [2023-05-13 01:00:11,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +29: [2023-05-13 01:00:11,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +31: [2023-05-13 01:00:11,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +31: [2023-05-13 01:00:11,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +25: [2023-05-13 01:00:11,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +12: [2023-05-13 01:00:11,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +25: [2023-05-13 01:00:11,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:11,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +12: [2023-05-13 01:00:11,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +12: [2023-05-13 01:00:11,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +25: [2023-05-13 01:00:11,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +14: [2023-05-13 01:00:11,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +31: [2023-05-13 01:00:11,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +31: [2023-05-13 01:00:11,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +31: [2023-05-13 01:00:11,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +25: [2023-05-13 01:00:11,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +25: [2023-05-13 01:00:11,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +12: [2023-05-13 01:00:11,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +25: [2023-05-13 01:00:11,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +12: [2023-05-13 01:00:11,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +25: [2023-05-13 01:00:11,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +25: [2023-05-13 01:00:11,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +12: [2023-05-13 01:00:11,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +18: [2023-05-13 01:00:11,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +18: [2023-05-13 01:00:11,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +12: [2023-05-13 01:00:11,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +18: [2023-05-13 01:00:11,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +18: [2023-05-13 01:00:11,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +18: [2023-05-13 01:00:11,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +18: [2023-05-13 01:00:11,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +18: [2023-05-13 01:00:11,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +18: [2023-05-13 01:00:11,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +31: [2023-05-13 01:00:11,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +14: [2023-05-13 01:00:11,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +14: [2023-05-13 01:00:11,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +18: [2023-05-13 01:00:11,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +18: [2023-05-13 01:00:11,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +18: [2023-05-13 01:00:11,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +18: [2023-05-13 01:00:11,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +18: [2023-05-13 01:00:11,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +18: [2023-05-13 01:00:11,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +18: [2023-05-13 01:00:11,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +18: [2023-05-13 01:00:11,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +17: [2023-05-13 01:00:11,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +17: [2023-05-13 01:00:11,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +15: [2023-05-13 01:00:12,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +31: [2023-05-13 01:00:12,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +14: [2023-05-13 01:00:12,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +14: [2023-05-13 01:00:12,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +14: [2023-05-13 01:00:12,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +31: [2023-05-13 01:00:12,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +15: [2023-05-13 01:00:12,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +15: [2023-05-13 01:00:12,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +17: [2023-05-13 01:00:12,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +17: [2023-05-13 01:00:12,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +15: [2023-05-13 01:00:12,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +15: [2023-05-13 01:00:12,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +15: [2023-05-13 01:00:12,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +15: [2023-05-13 01:00:12,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +17: [2023-05-13 01:00:12,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +15: [2023-05-13 01:00:12,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +14: [2023-05-13 01:00:12,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +14: [2023-05-13 01:00:12,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +31: [2023-05-13 01:00:12,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +31: [2023-05-13 01:00:12,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +31: [2023-05-13 01:00:12,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +14: [2023-05-13 01:00:12,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +31: [2023-05-13 01:00:12,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +31: [2023-05-13 01:00:12,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +31: [2023-05-13 01:00:12,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +17: [2023-05-13 01:00:12,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +17: [2023-05-13 01:00:12,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +17: [2023-05-13 01:00:12,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +14: [2023-05-13 01:00:12,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +14: [2023-05-13 01:00:12,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +15: [2023-05-13 01:00:12,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +31: [2023-05-13 01:00:12,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +31: [2023-05-13 01:00:12,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +17: [2023-05-13 01:00:12,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +12: [2023-05-13 01:00:12,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +14: [2023-05-13 01:00:12,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +14: [2023-05-13 01:00:12,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +14: [2023-05-13 01:00:12,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +15: [2023-05-13 01:00:12,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +17: [2023-05-13 01:00:12,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +15: [2023-05-13 01:00:12,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +14: [2023-05-13 01:00:12,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +15: [2023-05-13 01:00:12,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +11: [2023-05-13 01:00:12,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +11: [2023-05-13 01:00:12,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +11: [2023-05-13 01:00:12,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +11: [2023-05-13 01:00:12,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +29: [2023-05-13 01:00:12,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +15: [2023-05-13 01:00:12,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +25: [2023-05-13 01:00:12,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +25: [2023-05-13 01:00:12,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +17: [2023-05-13 01:00:12,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +24: [2023-05-13 01:00:12,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +24: [2023-05-13 01:00:12,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +24: [2023-05-13 01:00:12,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +24: [2023-05-13 01:00:12,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +24: [2023-05-13 01:00:12,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +24: [2023-05-13 01:00:12,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +24: [2023-05-13 01:00:12,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +24: [2023-05-13 01:00:12,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +24: [2023-05-13 01:00:12,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +29: [2023-05-13 01:00:12,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +24: [2023-05-13 01:00:12,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +29: [2023-05-13 01:00:12,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +29: [2023-05-13 01:00:12,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +29: [2023-05-13 01:00:12,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +11: [2023-05-13 01:00:12,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +24: [2023-05-13 01:00:12,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +24: [2023-05-13 01:00:12,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +24: [2023-05-13 01:00:12,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +24: [2023-05-13 01:00:12,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +24: [2023-05-13 01:00:12,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +24: [2023-05-13 01:00:12,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +29: [2023-05-13 01:00:12,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +29: [2023-05-13 01:00:12,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +25: [2023-05-13 01:00:12,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +18: [2023-05-13 01:00:12,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +12: [2023-05-13 01:00:12,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +16: [2023-05-13 01:00:12,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +16: [2023-05-13 01:00:12,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +16: [2023-05-13 01:00:12,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +30: [2023-05-13 01:00:12,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +16: [2023-05-13 01:00:12,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +16: [2023-05-13 01:00:12,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +16: [2023-05-13 01:00:12,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +16: [2023-05-13 01:00:12,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +16: [2023-05-13 01:00:12,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +30: [2023-05-13 01:00:12,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +29: [2023-05-13 01:00:12,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +11: [2023-05-13 01:00:12,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +30: [2023-05-13 01:00:12,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +25: [2023-05-13 01:00:12,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +18: [2023-05-13 01:00:12,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +16: [2023-05-13 01:00:12,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +11: [2023-05-13 01:00:12,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +12: [2023-05-13 01:00:12,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +12: [2023-05-13 01:00:12,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +30: [2023-05-13 01:00:12,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +30: [2023-05-13 01:00:12,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +30: [2023-05-13 01:00:12,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +30: [2023-05-13 01:00:12,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +30: [2023-05-13 01:00:12,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +30: [2023-05-13 01:00:12,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +30: [2023-05-13 01:00:12,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +25: [2023-05-13 01:00:12,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +17: [2023-05-13 01:00:12,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +17: [2023-05-13 01:00:12,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +11: [2023-05-13 01:00:12,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +29: [2023-05-13 01:00:12,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +11: [2023-05-13 01:00:12,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +11: [2023-05-13 01:00:12,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +11: [2023-05-13 01:00:12,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +16: [2023-05-13 01:00:12,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +16: [2023-05-13 01:00:12,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +16: [2023-05-13 01:00:12,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +18: [2023-05-13 01:00:12,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +18: [2023-05-13 01:00:12,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +17: [2023-05-13 01:00:12,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +29: [2023-05-13 01:00:12,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +16: [2023-05-13 01:00:12,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +16: [2023-05-13 01:00:12,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +16: [2023-05-13 01:00:12,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +16: [2023-05-13 01:00:12,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +18: [2023-05-13 01:00:12,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +18: [2023-05-13 01:00:12,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +23: [2023-05-13 01:00:12,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +23: [2023-05-13 01:00:12,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +23: [2023-05-13 01:00:12,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +23: [2023-05-13 01:00:12,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +23: [2023-05-13 01:00:12,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +23: [2023-05-13 01:00:12,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +23: [2023-05-13 01:00:12,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +30: [2023-05-13 01:00:12,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +11: [2023-05-13 01:00:12,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +23: [2023-05-13 01:00:12,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +30: [2023-05-13 01:00:12,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +30: [2023-05-13 01:00:12,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +30: [2023-05-13 01:00:12,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +30: [2023-05-13 01:00:12,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +30: [2023-05-13 01:00:12,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +18: [2023-05-13 01:00:12,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +18: [2023-05-13 01:00:12,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +29: [2023-05-13 01:00:12,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +23: [2023-05-13 01:00:12,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +25: [2023-05-13 01:00:12,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +25: [2023-05-13 01:00:12,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +25: [2023-05-13 01:00:12,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +29: [2023-05-13 01:00:12,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +23: [2023-05-13 01:00:12,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +12: [2023-05-13 01:00:12,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +23: [2023-05-13 01:00:12,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +11: [2023-05-13 01:00:12,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +29: [2023-05-13 01:00:12,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +27: [2023-05-13 01:00:12,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +27: [2023-05-13 01:00:12,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +27: [2023-05-13 01:00:12,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +27: [2023-05-13 01:00:12,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +27: [2023-05-13 01:00:12,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +27: [2023-05-13 01:00:12,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +27: [2023-05-13 01:00:12,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +23: [2023-05-13 01:00:12,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +27: [2023-05-13 01:00:12,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +18: [2023-05-13 01:00:12,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +24: [2023-05-13 01:00:12,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:12,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:12,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:12,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +12: [2023-05-13 01:00:12,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +19: [2023-05-13 01:00:12,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +19: [2023-05-13 01:00:12,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +19: [2023-05-13 01:00:12,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +19: [2023-05-13 01:00:12,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +12: [2023-05-13 01:00:12,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:12,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +19: [2023-05-13 01:00:12,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +19: [2023-05-13 01:00:12,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +19: [2023-05-13 01:00:12,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:12,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +19: [2023-05-13 01:00:12,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:12,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +29: [2023-05-13 01:00:12,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +29: [2023-05-13 01:00:12,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +12: [2023-05-13 01:00:12,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +12: [2023-05-13 01:00:12,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +12: [2023-05-13 01:00:12,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:12,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:12,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +19: [2023-05-13 01:00:12,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +29: [2023-05-13 01:00:12,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:12,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +10: [2023-05-13 01:00:12,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +18: [2023-05-13 01:00:12,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:12,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +10: [2023-05-13 01:00:12,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +10: [2023-05-13 01:00:12,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +19: [2023-05-13 01:00:12,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +10: [2023-05-13 01:00:12,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +10: [2023-05-13 01:00:12,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +10: [2023-05-13 01:00:12,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +10: [2023-05-13 01:00:12,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +11: [2023-05-13 01:00:12,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:12,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +11: [2023-05-13 01:00:12,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +21: [2023-05-13 01:00:12,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +21: [2023-05-13 01:00:12,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +21: [2023-05-13 01:00:12,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +21: [2023-05-13 01:00:12,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +21: [2023-05-13 01:00:12,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +21: [2023-05-13 01:00:12,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +21: [2023-05-13 01:00:12,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +21: [2023-05-13 01:00:12,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +10: [2023-05-13 01:00:12,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:12,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +19: [2023-05-13 01:00:12,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +19: [2023-05-13 01:00:12,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +18: [2023-05-13 01:00:12,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:12,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +19: [2023-05-13 01:00:12,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +18: [2023-05-13 01:00:12,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +21: [2023-05-13 01:00:12,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:12,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:12,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:12,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +19: [2023-05-13 01:00:12,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +19: [2023-05-13 01:00:12,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +19: [2023-05-13 01:00:12,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +21: [2023-05-13 01:00:12,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +18: [2023-05-13 01:00:12,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +21: [2023-05-13 01:00:12,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +21: [2023-05-13 01:00:12,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +21: [2023-05-13 01:00:12,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +18: [2023-05-13 01:00:12,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +21: [2023-05-13 01:00:12,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +11: [2023-05-13 01:00:12,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +21: [2023-05-13 01:00:12,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +21: [2023-05-13 01:00:12,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +18: [2023-05-13 01:00:12,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +18: [2023-05-13 01:00:12,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +12: [2023-05-13 01:00:12,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +24: [2023-05-13 01:00:12,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +12: [2023-05-13 01:00:12,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +16: [2023-05-13 01:00:12,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +30: [2023-05-13 01:00:12,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +30: [2023-05-13 01:00:12,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +12: [2023-05-13 01:00:12,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +26: [2023-05-13 01:00:12,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +26: [2023-05-13 01:00:12,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +26: [2023-05-13 01:00:12,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +26: [2023-05-13 01:00:12,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +26: [2023-05-13 01:00:12,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +26: [2023-05-13 01:00:12,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +26: [2023-05-13 01:00:12,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +12: [2023-05-13 01:00:12,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +26: [2023-05-13 01:00:12,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +26: [2023-05-13 01:00:12,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +12: [2023-05-13 01:00:12,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +26: [2023-05-13 01:00:12,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +26: [2023-05-13 01:00:12,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +26: [2023-05-13 01:00:12,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +24: [2023-05-13 01:00:12,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +26: [2023-05-13 01:00:12,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +26: [2023-05-13 01:00:12,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +26: [2023-05-13 01:00:12,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +23: [2023-05-13 01:00:12,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +23: [2023-05-13 01:00:12,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +26: [2023-05-13 01:00:12,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +24: [2023-05-13 01:00:12,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +24: [2023-05-13 01:00:12,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +24: [2023-05-13 01:00:12,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +24: [2023-05-13 01:00:12,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +16: [2023-05-13 01:00:12,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +12: [2023-05-13 01:00:12,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:12,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +25: [2023-05-13 01:00:12,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +25: [2023-05-13 01:00:12,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +25: [2023-05-13 01:00:12,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +25: [2023-05-13 01:00:12,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +25: [2023-05-13 01:00:12,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +25: [2023-05-13 01:00:12,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +25: [2023-05-13 01:00:12,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +25: [2023-05-13 01:00:12,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +28: [2023-05-13 01:00:12,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +28: [2023-05-13 01:00:12,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +28: [2023-05-13 01:00:12,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +28: [2023-05-13 01:00:12,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +28: [2023-05-13 01:00:12,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +28: [2023-05-13 01:00:12,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +28: [2023-05-13 01:00:12,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +28: [2023-05-13 01:00:12,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:12,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +27: [2023-05-13 01:00:12,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +19: [2023-05-13 01:00:12,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +28: [2023-05-13 01:00:12,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +21: [2023-05-13 01:00:12,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +30: [2023-05-13 01:00:12,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +28: [2023-05-13 01:00:12,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +28: [2023-05-13 01:00:12,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +10: [2023-05-13 01:00:12,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +28: [2023-05-13 01:00:12,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +28: [2023-05-13 01:00:12,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +10: [2023-05-13 01:00:12,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +28: [2023-05-13 01:00:12,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +28: [2023-05-13 01:00:12,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +28: [2023-05-13 01:00:12,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:12,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +26: [2023-05-13 01:00:12,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +16: [2023-05-13 01:00:12,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +16: [2023-05-13 01:00:12,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +16: [2023-05-13 01:00:12,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +23: [2023-05-13 01:00:12,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +16: [2023-05-13 01:00:12,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +30: [2023-05-13 01:00:12,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +30: [2023-05-13 01:00:12,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +30: [2023-05-13 01:00:12,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +16: [2023-05-13 01:00:12,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +16: [2023-05-13 01:00:12,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +13: [2023-05-13 01:00:12,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +13: [2023-05-13 01:00:12,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +23: [2023-05-13 01:00:12,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:12,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +13: [2023-05-13 01:00:12,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +24: [2023-05-13 01:00:12,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +13: [2023-05-13 01:00:12,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +13: [2023-05-13 01:00:12,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +13: [2023-05-13 01:00:12,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +13: [2023-05-13 01:00:12,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +13: [2023-05-13 01:00:12,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +13: [2023-05-13 01:00:12,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +13: [2023-05-13 01:00:12,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:12,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +27: [2023-05-13 01:00:12,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +13: [2023-05-13 01:00:12,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +23: [2023-05-13 01:00:12,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +24: [2023-05-13 01:00:12,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +23: [2023-05-13 01:00:12,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +23: [2023-05-13 01:00:12,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +13: [2023-05-13 01:00:12,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +13: [2023-05-13 01:00:12,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +24: [2023-05-13 01:00:12,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:12,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:12,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +13: [2023-05-13 01:00:12,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +13: [2023-05-13 01:00:12,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +13: [2023-05-13 01:00:12,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +21: [2023-05-13 01:00:12,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +21: [2023-05-13 01:00:12,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +24: [2023-05-13 01:00:12,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +21: [2023-05-13 01:00:12,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +19: [2023-05-13 01:00:12,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:12,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +21: [2023-05-13 01:00:12,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +24: [2023-05-13 01:00:12,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +21: [2023-05-13 01:00:12,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:12,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +21: [2023-05-13 01:00:12,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +21: [2023-05-13 01:00:12,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:12,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +30: [2023-05-13 01:00:12,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:12,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +19: [2023-05-13 01:00:12,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:12,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +22: [2023-05-13 01:00:12,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:12,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +22: [2023-05-13 01:00:12,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +22: [2023-05-13 01:00:12,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +22: [2023-05-13 01:00:12,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +22: [2023-05-13 01:00:12,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:12,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +21: [2023-05-13 01:00:12,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +30: [2023-05-13 01:00:12,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:12,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:12,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +10: [2023-05-13 01:00:12,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +20: [2023-05-13 01:00:12,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +20: [2023-05-13 01:00:12,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +22: [2023-05-13 01:00:12,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:12,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:12,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:12,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +19: [2023-05-13 01:00:12,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +19: [2023-05-13 01:00:12,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +19: [2023-05-13 01:00:12,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +22: [2023-05-13 01:00:12,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:12,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:12,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +26: [2023-05-13 01:00:12,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:12,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +20: [2023-05-13 01:00:12,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +20: [2023-05-13 01:00:12,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +20: [2023-05-13 01:00:12,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +20: [2023-05-13 01:00:12,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:12,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:12,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:12,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +20: [2023-05-13 01:00:12,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +10: [2023-05-13 01:00:12,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +10: [2023-05-13 01:00:12,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:12,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:12,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:12,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +20: [2023-05-13 01:00:12,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:12,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:12,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +16: [2023-05-13 01:00:12,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:12,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +16: [2023-05-13 01:00:12,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +30: [2023-05-13 01:00:12,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +30: [2023-05-13 01:00:12,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +23: [2023-05-13 01:00:12,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:12,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +20: [2023-05-13 01:00:12,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +10: [2023-05-13 01:00:12,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +16: [2023-05-13 01:00:12,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +21: [2023-05-13 01:00:12,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:12,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +20: [2023-05-13 01:00:12,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +27: [2023-05-13 01:00:12,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:12,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:12,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +16: [2023-05-13 01:00:12,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:12,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt... +23: [2023-05-13 01:00:12,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:12,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +21: [2023-05-13 01:00:12,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +27: [2023-05-13 01:00:12,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +21: [2023-05-13 01:00:12,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +21: [2023-05-13 01:00:12,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +21: [2023-05-13 01:00:12,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +28: [2023-05-13 01:00:12,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +30: [2023-05-13 01:00:12,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +21: [2023-05-13 01:00:12,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:12,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +21: [2023-05-13 01:00:12,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +19: [2023-05-13 01:00:12,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +19: [2023-05-13 01:00:12,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +13: [2023-05-13 01:00:12,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +19: [2023-05-13 01:00:12,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +19: [2023-05-13 01:00:12,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +19: [2023-05-13 01:00:12,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:12,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +16: [2023-05-13 01:00:12,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +28: [2023-05-13 01:00:12,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:12,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +19: [2023-05-13 01:00:12,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:12,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +26: [2023-05-13 01:00:12,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +26: [2023-05-13 01:00:12,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +26: [2023-05-13 01:00:12,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +26: [2023-05-13 01:00:12,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +28: [2023-05-13 01:00:12,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +28: [2023-05-13 01:00:12,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +28: [2023-05-13 01:00:12,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +28: [2023-05-13 01:00:12,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +28: [2023-05-13 01:00:12,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +28: [2023-05-13 01:00:12,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +19: [2023-05-13 01:00:12,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +13: [2023-05-13 01:00:12,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +13: [2023-05-13 01:00:12,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +26: [2023-05-13 01:00:12,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +10: [2023-05-13 01:00:12,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +23: [2023-05-13 01:00:12,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +22: [2023-05-13 01:00:12,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +13: [2023-05-13 01:00:12,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +13: [2023-05-13 01:00:12,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +23: [2023-05-13 01:00:12,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +26: [2023-05-13 01:00:12,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +13: [2023-05-13 01:00:12,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +28: [2023-05-13 01:00:12,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +26: [2023-05-13 01:00:12,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:12,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +19: [2023-05-13 01:00:12,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:12,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +22: [2023-05-13 01:00:12,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +19: [2023-05-13 01:00:12,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +19: [2023-05-13 01:00:12,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +28: [2023-05-13 01:00:12,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +13: [2023-05-13 01:00:12,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +13: [2023-05-13 01:00:12,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +13: [2023-05-13 01:00:12,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +13: [2023-05-13 01:00:12,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:12,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +28: [2023-05-13 01:00:12,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +28: [2023-05-13 01:00:12,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +13: [2023-05-13 01:00:12,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +13: [2023-05-13 01:00:12,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +26: [2023-05-13 01:00:12,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +22: [2023-05-13 01:00:12,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +13: [2023-05-13 01:00:12,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +26: [2023-05-13 01:00:12,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +28: [2023-05-13 01:00:12,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +28: [2023-05-13 01:00:12,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +22: [2023-05-13 01:00:12,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +22: [2023-05-13 01:00:12,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +22: [2023-05-13 01:00:12,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +22: [2023-05-13 01:00:12,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +26: [2023-05-13 01:00:12,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +28: [2023-05-13 01:00:12,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +28: [2023-05-13 01:00:12,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +26: [2023-05-13 01:00:12,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +26: [2023-05-13 01:00:12,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:12,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:12,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +22: [2023-05-13 01:00:12,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +13: [2023-05-13 01:00:12,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +13: [2023-05-13 01:00:12,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +13: [2023-05-13 01:00:12,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:12,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +20: [2023-05-13 01:00:12,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +20: [2023-05-13 01:00:12,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +20: [2023-05-13 01:00:12,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +22: [2023-05-13 01:00:12,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +22: [2023-05-13 01:00:12,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:12,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +20: [2023-05-13 01:00:12,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +20: [2023-05-13 01:00:12,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_22-model_00-model_states.pt. +22: [2023-05-13 01:00:12,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +22: [2023-05-13 01:00:12,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +22: [2023-05-13 01:00:12,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:12,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:12,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:12,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:12,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:12,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:12,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:12,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +27: [2023-05-13 01:00:12,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +27: [2023-05-13 01:00:12,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +27: [2023-05-13 01:00:12,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +27: [2023-05-13 01:00:12,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +27: [2023-05-13 01:00:12,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +27: [2023-05-13 01:00:12,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +27: [2023-05-13 01:00:12,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +27: [2023-05-13 01:00:12,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +27: [2023-05-13 01:00:12,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +27: [2023-05-13 01:00:12,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +27: [2023-05-13 01:00:12,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +27: [2023-05-13 01:00:12,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +27: [2023-05-13 01:00:12,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +27: [2023-05-13 01:00:12,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +27: [2023-05-13 01:00:12,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +27: [2023-05-13 01:00:12,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +14: [2023-05-13 01:00:12,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +14: [2023-05-13 01:00:12,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +14: [2023-05-13 01:00:12,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +14: [2023-05-13 01:00:12,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +14: [2023-05-13 01:00:12,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +14: [2023-05-13 01:00:12,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +14: [2023-05-13 01:00:12,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +14: [2023-05-13 01:00:12,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:12,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +14: [2023-05-13 01:00:12,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +14: [2023-05-13 01:00:12,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +14: [2023-05-13 01:00:12,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +14: [2023-05-13 01:00:12,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +14: [2023-05-13 01:00:12,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +14: [2023-05-13 01:00:12,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +14: [2023-05-13 01:00:12,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:12,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +27: [2023-05-13 01:00:12,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +27: [2023-05-13 01:00:12,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +27: [2023-05-13 01:00:12,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +27: [2023-05-13 01:00:12,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +27: [2023-05-13 01:00:12,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +27: [2023-05-13 01:00:12,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +27: [2023-05-13 01:00:12,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +27: [2023-05-13 01:00:12,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +10: [2023-05-13 01:00:12,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +10: [2023-05-13 01:00:12,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +10: [2023-05-13 01:00:12,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +10: [2023-05-13 01:00:12,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +10: [2023-05-13 01:00:12,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +10: [2023-05-13 01:00:12,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +10: [2023-05-13 01:00:12,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +10: [2023-05-13 01:00:12,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +10: [2023-05-13 01:00:12,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +10: [2023-05-13 01:00:12,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +17: [2023-05-13 01:00:12,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +17: [2023-05-13 01:00:12,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +10: [2023-05-13 01:00:12,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +10: [2023-05-13 01:00:12,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +10: [2023-05-13 01:00:12,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +10: [2023-05-13 01:00:12,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +10: [2023-05-13 01:00:12,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +10: [2023-05-13 01:00:12,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +17: [2023-05-13 01:00:12,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +17: [2023-05-13 01:00:12,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +17: [2023-05-13 01:00:12,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +17: [2023-05-13 01:00:12,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +31: [2023-05-13 01:00:12,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +31: [2023-05-13 01:00:12,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +17: [2023-05-13 01:00:12,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +17: [2023-05-13 01:00:12,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +17: [2023-05-13 01:00:12,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +31: [2023-05-13 01:00:12,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +31: [2023-05-13 01:00:12,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +31: [2023-05-13 01:00:12,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +31: [2023-05-13 01:00:12,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +31: [2023-05-13 01:00:12,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +31: [2023-05-13 01:00:12,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +17: [2023-05-13 01:00:12,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +17: [2023-05-13 01:00:12,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +31: [2023-05-13 01:00:12,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +31: [2023-05-13 01:00:12,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:12,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +17: [2023-05-13 01:00:12,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +31: [2023-05-13 01:00:12,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:12,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:12,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +14: [2023-05-13 01:00:12,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +27: [2023-05-13 01:00:12,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:12,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:12,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:12,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:12,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +31: [2023-05-13 01:00:12,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +31: [2023-05-13 01:00:12,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +17: [2023-05-13 01:00:12,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +31: [2023-05-13 01:00:12,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +27: [2023-05-13 01:00:12,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:12,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:12,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +21: [2023-05-13 01:00:12,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +27: [2023-05-13 01:00:12,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +27: [2023-05-13 01:00:12,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:12,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:12,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +21: [2023-05-13 01:00:12,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +21: [2023-05-13 01:00:12,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +21: [2023-05-13 01:00:12,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +21: [2023-05-13 01:00:12,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +21: [2023-05-13 01:00:12,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 4: [2023-05-13 01:00:12,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:12,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +29: [2023-05-13 01:00:12,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +29: [2023-05-13 01:00:12,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +29: [2023-05-13 01:00:12,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +29: [2023-05-13 01:00:12,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +29: [2023-05-13 01:00:12,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +29: [2023-05-13 01:00:12,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +29: [2023-05-13 01:00:12,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 4: [2023-05-13 01:00:12,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +21: [2023-05-13 01:00:12,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +21: [2023-05-13 01:00:12,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +21: [2023-05-13 01:00:12,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +29: [2023-05-13 01:00:12,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +29: [2023-05-13 01:00:12,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +29: [2023-05-13 01:00:12,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +21: [2023-05-13 01:00:12,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +21: [2023-05-13 01:00:12,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +29: [2023-05-13 01:00:12,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +29: [2023-05-13 01:00:12,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +29: [2023-05-13 01:00:12,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +29: [2023-05-13 01:00:12,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +29: [2023-05-13 01:00:12,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +21: [2023-05-13 01:00:12,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +21: [2023-05-13 01:00:12,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +14: [2023-05-13 01:00:12,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +14: [2023-05-13 01:00:12,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +14: [2023-05-13 01:00:12,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +14: [2023-05-13 01:00:12,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +14: [2023-05-13 01:00:12,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +14: [2023-05-13 01:00:12,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +10: [2023-05-13 01:00:12,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +14: [2023-05-13 01:00:12,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +17: [2023-05-13 01:00:12,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +10: [2023-05-13 01:00:12,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +14: [2023-05-13 01:00:12,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +31: [2023-05-13 01:00:12,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +17: [2023-05-13 01:00:12,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +10: [2023-05-13 01:00:12,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +14: [2023-05-13 01:00:12,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +14: [2023-05-13 01:00:12,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +14: [2023-05-13 01:00:12,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +10: [2023-05-13 01:00:12,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +14: [2023-05-13 01:00:12,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +10: [2023-05-13 01:00:12,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +10: [2023-05-13 01:00:12,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +10: [2023-05-13 01:00:12,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +21: [2023-05-13 01:00:12,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +17: [2023-05-13 01:00:12,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +31: [2023-05-13 01:00:12,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +14: [2023-05-13 01:00:12,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +31: [2023-05-13 01:00:12,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +31: [2023-05-13 01:00:12,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +31: [2023-05-13 01:00:12,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +31: [2023-05-13 01:00:12,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +31: [2023-05-13 01:00:12,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +31: [2023-05-13 01:00:12,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:12,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +29: [2023-05-13 01:00:12,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +14: [2023-05-13 01:00:12,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +31: [2023-05-13 01:00:12,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +10: [2023-05-13 01:00:12,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:12,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +10: [2023-05-13 01:00:12,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +10: [2023-05-13 01:00:12,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:12,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +21: [2023-05-13 01:00:12,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +21: [2023-05-13 01:00:12,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +29: [2023-05-13 01:00:12,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +17: [2023-05-13 01:00:12,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +21: [2023-05-13 01:00:12,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +10: [2023-05-13 01:00:12,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:12,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +29: [2023-05-13 01:00:12,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +21: [2023-05-13 01:00:12,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:12,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +21: [2023-05-13 01:00:12,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +10: [2023-05-13 01:00:12,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:12,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +29: [2023-05-13 01:00:12,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +29: [2023-05-13 01:00:12,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +29: [2023-05-13 01:00:12,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:12,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +10: [2023-05-13 01:00:12,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +10: [2023-05-13 01:00:12,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:12,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +17: [2023-05-13 01:00:12,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +17: [2023-05-13 01:00:12,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +31: [2023-05-13 01:00:12,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 6: [2023-05-13 01:00:12,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:12,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +10: [2023-05-13 01:00:12,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:12,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:12,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +31: [2023-05-13 01:00:12,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +31: [2023-05-13 01:00:12,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +10: [2023-05-13 01:00:12,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:12,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +21: [2023-05-13 01:00:12,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +21: [2023-05-13 01:00:12,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +21: [2023-05-13 01:00:12,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:12,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:12,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +29: [2023-05-13 01:00:12,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +21: [2023-05-13 01:00:12,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 6: [2023-05-13 01:00:12,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +15: [2023-05-13 01:00:12,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +15: [2023-05-13 01:00:12,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +17: [2023-05-13 01:00:12,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:12,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +15: [2023-05-13 01:00:12,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +15: [2023-05-13 01:00:12,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +15: [2023-05-13 01:00:12,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 7: [2023-05-13 01:00:12,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +15: [2023-05-13 01:00:12,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +15: [2023-05-13 01:00:12,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +15: [2023-05-13 01:00:12,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +15: [2023-05-13 01:00:12,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +15: [2023-05-13 01:00:12,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +15: [2023-05-13 01:00:12,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +15: [2023-05-13 01:00:12,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +15: [2023-05-13 01:00:12,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +15: [2023-05-13 01:00:12,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +11: [2023-05-13 01:00:12,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +11: [2023-05-13 01:00:12,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +11: [2023-05-13 01:00:12,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +11: [2023-05-13 01:00:12,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +11: [2023-05-13 01:00:12,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +11: [2023-05-13 01:00:12,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +11: [2023-05-13 01:00:12,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +11: [2023-05-13 01:00:12,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +15: [2023-05-13 01:00:12,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +15: [2023-05-13 01:00:12,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +21: [2023-05-13 01:00:12,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:12,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +17: [2023-05-13 01:00:12,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +29: [2023-05-13 01:00:12,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:12,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +11: [2023-05-13 01:00:12,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +29: [2023-05-13 01:00:12,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +11: [2023-05-13 01:00:12,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +11: [2023-05-13 01:00:12,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +11: [2023-05-13 01:00:12,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +11: [2023-05-13 01:00:12,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +29: [2023-05-13 01:00:12,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +21: [2023-05-13 01:00:12,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:12,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +29: [2023-05-13 01:00:12,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +11: [2023-05-13 01:00:12,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +11: [2023-05-13 01:00:12,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 7: [2023-05-13 01:00:12,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:12,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +17: [2023-05-13 01:00:12,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +21: [2023-05-13 01:00:12,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:12,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +24: [2023-05-13 01:00:12,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +24: [2023-05-13 01:00:12,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +24: [2023-05-13 01:00:12,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +24: [2023-05-13 01:00:12,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +24: [2023-05-13 01:00:12,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +24: [2023-05-13 01:00:12,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +24: [2023-05-13 01:00:12,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +24: [2023-05-13 01:00:12,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +17: [2023-05-13 01:00:12,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +24: [2023-05-13 01:00:12,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +24: [2023-05-13 01:00:12,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +30: [2023-05-13 01:00:12,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +12: [2023-05-13 01:00:12,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +12: [2023-05-13 01:00:12,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +12: [2023-05-13 01:00:12,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +12: [2023-05-13 01:00:12,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +12: [2023-05-13 01:00:12,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +12: [2023-05-13 01:00:12,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +12: [2023-05-13 01:00:12,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +12: [2023-05-13 01:00:12,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +25: [2023-05-13 01:00:12,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +25: [2023-05-13 01:00:12,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +19: [2023-05-13 01:00:12,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +24: [2023-05-13 01:00:12,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +30: [2023-05-13 01:00:12,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +19: [2023-05-13 01:00:12,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +19: [2023-05-13 01:00:12,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +19: [2023-05-13 01:00:12,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +19: [2023-05-13 01:00:12,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +19: [2023-05-13 01:00:12,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +19: [2023-05-13 01:00:12,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +24: [2023-05-13 01:00:12,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +13: [2023-05-13 01:00:12,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +13: [2023-05-13 01:00:12,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +12: [2023-05-13 01:00:12,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +19: [2023-05-13 01:00:12,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +25: [2023-05-13 01:00:12,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +12: [2023-05-13 01:00:12,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +24: [2023-05-13 01:00:12,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +30: [2023-05-13 01:00:12,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +25: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +25: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +23: [2023-05-13 01:00:12,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +24: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +25: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +25: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +25: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +25: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +25: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +28: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +28: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +28: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +28: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +28: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +12: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +28: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +28: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +19: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +28: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +25: [2023-05-13 01:00:12,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +16: [2023-05-13 01:00:12,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +16: [2023-05-13 01:00:12,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +19: [2023-05-13 01:00:12,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +16: [2023-05-13 01:00:12,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +16: [2023-05-13 01:00:12,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +16: [2023-05-13 01:00:12,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +23: [2023-05-13 01:00:12,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +16: [2023-05-13 01:00:12,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +16: [2023-05-13 01:00:12,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +13: [2023-05-13 01:00:12,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +13: [2023-05-13 01:00:12,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +13: [2023-05-13 01:00:12,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +13: [2023-05-13 01:00:12,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +13: [2023-05-13 01:00:12,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +16: [2023-05-13 01:00:12,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +13: [2023-05-13 01:00:12,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +13: [2023-05-13 01:00:12,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +13: [2023-05-13 01:00:12,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +12: [2023-05-13 01:00:12,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +19: [2023-05-13 01:00:12,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +23: [2023-05-13 01:00:12,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +23: [2023-05-13 01:00:12,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +23: [2023-05-13 01:00:12,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +23: [2023-05-13 01:00:12,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +15: [2023-05-13 01:00:12,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +23: [2023-05-13 01:00:12,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +16: [2023-05-13 01:00:12,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +12: [2023-05-13 01:00:12,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +28: [2023-05-13 01:00:12,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +28: [2023-05-13 01:00:12,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +28: [2023-05-13 01:00:12,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +12: [2023-05-13 01:00:12,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:12,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +22: [2023-05-13 01:00:12,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +22: [2023-05-13 01:00:12,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +22: [2023-05-13 01:00:12,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +22: [2023-05-13 01:00:12,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +22: [2023-05-13 01:00:12,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +22: [2023-05-13 01:00:12,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +28: [2023-05-13 01:00:12,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:12,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +16: [2023-05-13 01:00:12,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +28: [2023-05-13 01:00:12,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +28: [2023-05-13 01:00:12,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +12: [2023-05-13 01:00:12,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +13: [2023-05-13 01:00:12,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +16: [2023-05-13 01:00:12,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +25: [2023-05-13 01:00:12,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +25: [2023-05-13 01:00:12,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +30: [2023-05-13 01:00:12,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +30: [2023-05-13 01:00:12,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +28: [2023-05-13 01:00:12,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +25: [2023-05-13 01:00:12,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +30: [2023-05-13 01:00:12,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +28: [2023-05-13 01:00:12,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +25: [2023-05-13 01:00:12,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +12: [2023-05-13 01:00:12,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +25: [2023-05-13 01:00:12,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +19: [2023-05-13 01:00:12,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +16: [2023-05-13 01:00:12,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +30: [2023-05-13 01:00:12,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +19: [2023-05-13 01:00:12,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:12,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +22: [2023-05-13 01:00:12,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +19: [2023-05-13 01:00:12,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +19: [2023-05-13 01:00:12,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:12,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +22: [2023-05-13 01:00:12,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +13: [2023-05-13 01:00:12,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +13: [2023-05-13 01:00:12,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:12,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +13: [2023-05-13 01:00:12,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:12,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +13: [2023-05-13 01:00:12,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +13: [2023-05-13 01:00:12,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +19: [2023-05-13 01:00:12,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +16: [2023-05-13 01:00:12,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:12,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +22: [2023-05-13 01:00:12,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:12,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +16: [2023-05-13 01:00:12,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +16: [2023-05-13 01:00:12,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +15: [2023-05-13 01:00:12,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +15: [2023-05-13 01:00:12,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +15: [2023-05-13 01:00:12,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +15: [2023-05-13 01:00:12,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +11: [2023-05-13 01:00:12,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +11: [2023-05-13 01:00:12,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +11: [2023-05-13 01:00:12,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +11: [2023-05-13 01:00:12,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +24: [2023-05-13 01:00:12,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +12: [2023-05-13 01:00:12,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +25: [2023-05-13 01:00:12,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +25: [2023-05-13 01:00:12,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +11: [2023-05-13 01:00:12,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +11: [2023-05-13 01:00:12,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +15: [2023-05-13 01:00:12,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +24: [2023-05-13 01:00:12,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +15: [2023-05-13 01:00:12,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +15: [2023-05-13 01:00:12,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:12,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +15: [2023-05-13 01:00:12,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +15: [2023-05-13 01:00:12,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +15: [2023-05-13 01:00:12,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +15: [2023-05-13 01:00:12,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +13: [2023-05-13 01:00:12,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +13: [2023-05-13 01:00:12,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +13: [2023-05-13 01:00:12,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +23: [2023-05-13 01:00:12,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +23: [2023-05-13 01:00:12,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +11: [2023-05-13 01:00:12,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +24: [2023-05-13 01:00:12,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +19: [2023-05-13 01:00:12,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +11: [2023-05-13 01:00:12,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +22: [2023-05-13 01:00:12,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +22: [2023-05-13 01:00:12,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +25: [2023-05-13 01:00:12,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +28: [2023-05-13 01:00:12,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +11: [2023-05-13 01:00:12,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +11: [2023-05-13 01:00:12,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +23: [2023-05-13 01:00:12,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +11: [2023-05-13 01:00:12,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +28: [2023-05-13 01:00:12,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +28: [2023-05-13 01:00:12,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +28: [2023-05-13 01:00:12,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +28: [2023-05-13 01:00:12,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +28: [2023-05-13 01:00:12,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +28: [2023-05-13 01:00:12,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +28: [2023-05-13 01:00:12,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +25: [2023-05-13 01:00:12,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +22: [2023-05-13 01:00:12,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +22: [2023-05-13 01:00:12,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +19: [2023-05-13 01:00:12,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +12: [2023-05-13 01:00:12,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +12: [2023-05-13 01:00:12,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +25: [2023-05-13 01:00:12,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +22: [2023-05-13 01:00:12,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:12,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +11: [2023-05-13 01:00:12,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +13: [2023-05-13 01:00:12,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +13: [2023-05-13 01:00:12,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +16: [2023-05-13 01:00:12,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +12: [2023-05-13 01:00:12,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +16: [2023-05-13 01:00:12,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +22: [2023-05-13 01:00:12,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +24: [2023-05-13 01:00:12,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +11: [2023-05-13 01:00:12,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +19: [2023-05-13 01:00:12,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +13: [2023-05-13 01:00:12,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +11: [2023-05-13 01:00:12,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +15: [2023-05-13 01:00:12,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +15: [2023-05-13 01:00:12,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +13: [2023-05-13 01:00:12,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +12: [2023-05-13 01:00:12,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +13: [2023-05-13 01:00:12,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +13: [2023-05-13 01:00:12,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +23: [2023-05-13 01:00:12,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +15: [2023-05-13 01:00:12,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +23: [2023-05-13 01:00:12,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +23: [2023-05-13 01:00:12,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +24: [2023-05-13 01:00:12,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +15: [2023-05-13 01:00:12,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +19: [2023-05-13 01:00:12,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +13: [2023-05-13 01:00:12,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +22: [2023-05-13 01:00:12,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +22: [2023-05-13 01:00:12,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +25: [2023-05-13 01:00:12,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +13: [2023-05-13 01:00:12,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +25: [2023-05-13 01:00:12,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +25: [2023-05-13 01:00:12,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +25: [2023-05-13 01:00:12,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +24: [2023-05-13 01:00:12,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +24: [2023-05-13 01:00:12,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +25: [2023-05-13 01:00:12,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +25: [2023-05-13 01:00:12,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +16: [2023-05-13 01:00:12,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +16: [2023-05-13 01:00:12,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +28: [2023-05-13 01:00:12,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +28: [2023-05-13 01:00:12,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +18: [2023-05-13 01:00:12,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +18: [2023-05-13 01:00:12,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +16: [2023-05-13 01:00:12,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +16: [2023-05-13 01:00:12,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +28: [2023-05-13 01:00:12,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +18: [2023-05-13 01:00:12,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +28: [2023-05-13 01:00:12,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +28: [2023-05-13 01:00:12,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +19: [2023-05-13 01:00:12,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +18: [2023-05-13 01:00:12,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +18: [2023-05-13 01:00:12,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +18: [2023-05-13 01:00:12,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +18: [2023-05-13 01:00:12,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +19: [2023-05-13 01:00:12,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +19: [2023-05-13 01:00:12,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +23: [2023-05-13 01:00:12,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +18: [2023-05-13 01:00:12,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +22: [2023-05-13 01:00:12,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:12,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +18: [2023-05-13 01:00:12,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +28: [2023-05-13 01:00:12,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +18: [2023-05-13 01:00:12,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +22: [2023-05-13 01:00:12,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +24: [2023-05-13 01:00:12,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +30: [2023-05-13 01:00:12,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +13: [2023-05-13 01:00:12,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:12,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +28: [2023-05-13 01:00:12,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +28: [2023-05-13 01:00:12,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +13: [2023-05-13 01:00:12,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +12: [2023-05-13 01:00:12,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +18: [2023-05-13 01:00:12,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +12: [2023-05-13 01:00:12,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +22: [2023-05-13 01:00:12,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +22: [2023-05-13 01:00:12,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +24: [2023-05-13 01:00:12,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +30: [2023-05-13 01:00:12,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +22: [2023-05-13 01:00:12,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +22: [2023-05-13 01:00:12,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:12,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +18: [2023-05-13 01:00:12,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +18: [2023-05-13 01:00:12,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +11: [2023-05-13 01:00:12,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +18: [2023-05-13 01:00:12,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +18: [2023-05-13 01:00:12,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +13: [2023-05-13 01:00:12,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +12: [2023-05-13 01:00:12,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +12: [2023-05-13 01:00:12,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +12: [2023-05-13 01:00:12,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +12: [2023-05-13 01:00:12,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:12,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +23: [2023-05-13 01:00:12,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +19: [2023-05-13 01:00:12,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +19: [2023-05-13 01:00:12,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +19: [2023-05-13 01:00:12,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +23: [2023-05-13 01:00:12,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:12,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +26: [2023-05-13 01:00:12,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +26: [2023-05-13 01:00:12,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +26: [2023-05-13 01:00:12,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +26: [2023-05-13 01:00:12,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +26: [2023-05-13 01:00:12,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +26: [2023-05-13 01:00:12,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +26: [2023-05-13 01:00:12,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +13: [2023-05-13 01:00:12,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +30: [2023-05-13 01:00:12,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +13: [2023-05-13 01:00:12,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +12: [2023-05-13 01:00:12,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:12,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +26: [2023-05-13 01:00:12,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +26: [2023-05-13 01:00:12,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +26: [2023-05-13 01:00:12,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +30: [2023-05-13 01:00:12,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +25: [2023-05-13 01:00:12,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +26: [2023-05-13 01:00:12,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +30: [2023-05-13 01:00:12,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:12,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +24: [2023-05-13 01:00:12,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:12,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +26: [2023-05-13 01:00:12,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +25: [2023-05-13 01:00:12,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:12,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +25: [2023-05-13 01:00:12,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +25: [2023-05-13 01:00:12,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +25: [2023-05-13 01:00:12,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:12,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +22: [2023-05-13 01:00:12,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +22: [2023-05-13 01:00:12,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +30: [2023-05-13 01:00:12,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +23: [2023-05-13 01:00:12,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +16: [2023-05-13 01:00:12,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:12,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:12,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +16: [2023-05-13 01:00:12,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +12: [2023-05-13 01:00:12,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:12,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +23: [2023-05-13 01:00:12,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:12,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +23: [2023-05-13 01:00:12,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +12: [2023-05-13 01:00:12,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +23: [2023-05-13 01:00:12,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:12,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:12,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +12: [2023-05-13 01:00:12,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:12,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +20: [2023-05-13 01:00:12,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +20: [2023-05-13 01:00:12,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +20: [2023-05-13 01:00:12,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +20: [2023-05-13 01:00:12,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +20: [2023-05-13 01:00:12,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +18: [2023-05-13 01:00:12,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +16: [2023-05-13 01:00:12,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:12,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:12,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:12,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:12,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +20: [2023-05-13 01:00:12,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... + 1: [2023-05-13 01:00:12,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:12,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt... +23: [2023-05-13 01:00:12,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +18: [2023-05-13 01:00:12,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +19: [2023-05-13 01:00:12,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +19: [2023-05-13 01:00:12,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +19: [2023-05-13 01:00:12,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +19: [2023-05-13 01:00:12,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +19: [2023-05-13 01:00:12,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +19: [2023-05-13 01:00:12,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:12,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +18: [2023-05-13 01:00:12,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:12,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +18: [2023-05-13 01:00:12,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +18: [2023-05-13 01:00:12,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +18: [2023-05-13 01:00:12,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +18: [2023-05-13 01:00:12,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +18: [2023-05-13 01:00:12,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +18: [2023-05-13 01:00:12,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +18: [2023-05-13 01:00:12,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:12,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:12,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:12,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:12,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:12,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +26: [2023-05-13 01:00:12,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +18: [2023-05-13 01:00:12,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +18: [2023-05-13 01:00:12,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +18: [2023-05-13 01:00:12,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +14: [2023-05-13 01:00:12,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +14: [2023-05-13 01:00:12,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +14: [2023-05-13 01:00:12,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +14: [2023-05-13 01:00:12,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +14: [2023-05-13 01:00:12,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +14: [2023-05-13 01:00:12,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +14: [2023-05-13 01:00:12,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +14: [2023-05-13 01:00:12,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +31: [2023-05-13 01:00:12,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +31: [2023-05-13 01:00:12,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +31: [2023-05-13 01:00:12,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +31: [2023-05-13 01:00:12,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +31: [2023-05-13 01:00:12,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +31: [2023-05-13 01:00:12,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +31: [2023-05-13 01:00:12,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +31: [2023-05-13 01:00:12,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +18: [2023-05-13 01:00:12,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +14: [2023-05-13 01:00:12,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +18: [2023-05-13 01:00:12,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +18: [2023-05-13 01:00:12,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +14: [2023-05-13 01:00:12,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +31: [2023-05-13 01:00:12,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +14: [2023-05-13 01:00:12,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +14: [2023-05-13 01:00:12,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +14: [2023-05-13 01:00:12,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +31: [2023-05-13 01:00:12,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +14: [2023-05-13 01:00:12,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +14: [2023-05-13 01:00:12,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +31: [2023-05-13 01:00:12,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +31: [2023-05-13 01:00:12,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:12,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +31: [2023-05-13 01:00:12,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +14: [2023-05-13 01:00:12,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +31: [2023-05-13 01:00:12,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:12,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +26: [2023-05-13 01:00:12,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +26: [2023-05-13 01:00:12,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +31: [2023-05-13 01:00:12,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +31: [2023-05-13 01:00:12,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +20: [2023-05-13 01:00:12,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:12,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:12,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +26: [2023-05-13 01:00:12,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:12,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +20: [2023-05-13 01:00:12,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:12,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +26: [2023-05-13 01:00:12,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:12,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:12,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:12,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:12,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +20: [2023-05-13 01:00:12,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +20: [2023-05-13 01:00:12,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_23-model_00-model_states.pt. +14: [2023-05-13 01:00:12,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:12,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:12,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +31: [2023-05-13 01:00:12,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:12,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +31: [2023-05-13 01:00:12,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +31: [2023-05-13 01:00:12,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +31: [2023-05-13 01:00:12,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +31: [2023-05-13 01:00:12,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +31: [2023-05-13 01:00:12,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:12,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +31: [2023-05-13 01:00:12,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +31: [2023-05-13 01:00:12,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +14: [2023-05-13 01:00:12,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +14: [2023-05-13 01:00:12,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 0: [2023-05-13 01:00:12,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +14: [2023-05-13 01:00:12,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +14: [2023-05-13 01:00:12,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +14: [2023-05-13 01:00:12,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:12,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:12,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +14: [2023-05-13 01:00:12,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +20: [2023-05-13 01:00:12,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +14: [2023-05-13 01:00:12,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:12,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +31: [2023-05-13 01:00:12,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:12,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:12,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:12,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:12,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:12,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:12,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:12,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:12,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:12,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:12,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:12,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:12,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 0: [2023-05-13 01:00:12,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:12,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +17: [2023-05-13 01:00:12,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +17: [2023-05-13 01:00:12,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +23: [2023-05-13 01:00:12,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +23: [2023-05-13 01:00:12,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +23: [2023-05-13 01:00:12,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +17: [2023-05-13 01:00:12,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +17: [2023-05-13 01:00:12,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +17: [2023-05-13 01:00:12,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +17: [2023-05-13 01:00:12,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +17: [2023-05-13 01:00:12,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +17: [2023-05-13 01:00:12,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +23: [2023-05-13 01:00:12,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +17: [2023-05-13 01:00:12,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +23: [2023-05-13 01:00:12,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +23: [2023-05-13 01:00:12,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +23: [2023-05-13 01:00:12,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +23: [2023-05-13 01:00:12,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +17: [2023-05-13 01:00:12,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +23: [2023-05-13 01:00:12,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +14: [2023-05-13 01:00:12,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:12,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +23: [2023-05-13 01:00:12,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +23: [2023-05-13 01:00:12,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +17: [2023-05-13 01:00:12,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +23: [2023-05-13 01:00:12,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +23: [2023-05-13 01:00:12,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +23: [2023-05-13 01:00:12,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +23: [2023-05-13 01:00:12,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +17: [2023-05-13 01:00:12,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +17: [2023-05-13 01:00:12,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +23: [2023-05-13 01:00:12,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +17: [2023-05-13 01:00:12,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:12,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 2: [2023-05-13 01:00:12,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +23: [2023-05-13 01:00:12,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +15: [2023-05-13 01:00:12,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +15: [2023-05-13 01:00:12,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +15: [2023-05-13 01:00:12,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +15: [2023-05-13 01:00:12,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +15: [2023-05-13 01:00:12,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +15: [2023-05-13 01:00:12,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +15: [2023-05-13 01:00:12,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +15: [2023-05-13 01:00:12,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 2: [2023-05-13 01:00:12,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +15: [2023-05-13 01:00:12,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +15: [2023-05-13 01:00:12,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +15: [2023-05-13 01:00:12,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +15: [2023-05-13 01:00:12,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +15: [2023-05-13 01:00:12,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +15: [2023-05-13 01:00:12,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +15: [2023-05-13 01:00:12,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +17: [2023-05-13 01:00:12,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +15: [2023-05-13 01:00:12,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +23: [2023-05-13 01:00:12,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +29: [2023-05-13 01:00:12,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +29: [2023-05-13 01:00:12,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +29: [2023-05-13 01:00:12,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +29: [2023-05-13 01:00:12,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +29: [2023-05-13 01:00:12,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +29: [2023-05-13 01:00:12,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +29: [2023-05-13 01:00:12,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +29: [2023-05-13 01:00:12,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +17: [2023-05-13 01:00:12,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:12,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +17: [2023-05-13 01:00:12,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +23: [2023-05-13 01:00:12,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:12,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +29: [2023-05-13 01:00:12,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +29: [2023-05-13 01:00:12,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +29: [2023-05-13 01:00:12,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +29: [2023-05-13 01:00:12,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +29: [2023-05-13 01:00:12,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +29: [2023-05-13 01:00:12,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +17: [2023-05-13 01:00:12,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +23: [2023-05-13 01:00:12,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +23: [2023-05-13 01:00:12,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +25: [2023-05-13 01:00:12,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +25: [2023-05-13 01:00:12,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +25: [2023-05-13 01:00:12,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +25: [2023-05-13 01:00:12,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +25: [2023-05-13 01:00:12,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +25: [2023-05-13 01:00:12,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +25: [2023-05-13 01:00:12,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +17: [2023-05-13 01:00:12,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +25: [2023-05-13 01:00:12,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +25: [2023-05-13 01:00:12,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +25: [2023-05-13 01:00:12,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +17: [2023-05-13 01:00:12,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +25: [2023-05-13 01:00:12,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +25: [2023-05-13 01:00:12,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +25: [2023-05-13 01:00:12,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +25: [2023-05-13 01:00:12,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +25: [2023-05-13 01:00:12,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +25: [2023-05-13 01:00:12,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +23: [2023-05-13 01:00:12,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:12,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +23: [2023-05-13 01:00:12,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +23: [2023-05-13 01:00:12,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +23: [2023-05-13 01:00:12,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +23: [2023-05-13 01:00:12,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +23: [2023-05-13 01:00:12,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +17: [2023-05-13 01:00:12,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +17: [2023-05-13 01:00:12,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +17: [2023-05-13 01:00:12,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +23: [2023-05-13 01:00:12,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:12,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +15: [2023-05-13 01:00:12,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +15: [2023-05-13 01:00:12,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +15: [2023-05-13 01:00:12,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +15: [2023-05-13 01:00:12,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +17: [2023-05-13 01:00:12,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:12,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +23: [2023-05-13 01:00:12,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +15: [2023-05-13 01:00:12,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +25: [2023-05-13 01:00:12,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +17: [2023-05-13 01:00:12,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:12,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +15: [2023-05-13 01:00:12,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +15: [2023-05-13 01:00:12,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +23: [2023-05-13 01:00:12,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:12,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +15: [2023-05-13 01:00:12,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +23: [2023-05-13 01:00:12,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +23: [2023-05-13 01:00:12,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:12,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +29: [2023-05-13 01:00:12,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +29: [2023-05-13 01:00:12,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +25: [2023-05-13 01:00:12,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +17: [2023-05-13 01:00:12,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +15: [2023-05-13 01:00:12,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:12,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +15: [2023-05-13 01:00:12,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +15: [2023-05-13 01:00:12,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +15: [2023-05-13 01:00:12,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:12,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +11: [2023-05-13 01:00:12,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +29: [2023-05-13 01:00:12,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +25: [2023-05-13 01:00:12,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +11: [2023-05-13 01:00:12,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +29: [2023-05-13 01:00:12,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +25: [2023-05-13 01:00:12,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:12,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +15: [2023-05-13 01:00:12,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +11: [2023-05-13 01:00:12,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +11: [2023-05-13 01:00:12,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +11: [2023-05-13 01:00:12,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +11: [2023-05-13 01:00:12,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +11: [2023-05-13 01:00:12,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +11: [2023-05-13 01:00:12,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +29: [2023-05-13 01:00:12,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +29: [2023-05-13 01:00:12,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +15: [2023-05-13 01:00:12,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +15: [2023-05-13 01:00:12,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +11: [2023-05-13 01:00:12,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +11: [2023-05-13 01:00:12,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +25: [2023-05-13 01:00:12,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +25: [2023-05-13 01:00:12,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +25: [2023-05-13 01:00:12,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +11: [2023-05-13 01:00:12,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +29: [2023-05-13 01:00:12,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:12,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +11: [2023-05-13 01:00:12,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +25: [2023-05-13 01:00:12,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:12,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +29: [2023-05-13 01:00:12,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +15: [2023-05-13 01:00:12,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:12,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:12,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +25: [2023-05-13 01:00:12,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +25: [2023-05-13 01:00:12,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:12,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:12,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +29: [2023-05-13 01:00:12,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +25: [2023-05-13 01:00:12,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +25: [2023-05-13 01:00:12,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +25: [2023-05-13 01:00:12,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +25: [2023-05-13 01:00:12,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +16: [2023-05-13 01:00:12,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +11: [2023-05-13 01:00:12,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +16: [2023-05-13 01:00:12,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +16: [2023-05-13 01:00:12,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:12,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +25: [2023-05-13 01:00:12,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +16: [2023-05-13 01:00:12,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +16: [2023-05-13 01:00:12,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +16: [2023-05-13 01:00:12,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +16: [2023-05-13 01:00:12,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +16: [2023-05-13 01:00:12,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +16: [2023-05-13 01:00:12,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +11: [2023-05-13 01:00:12,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +25: [2023-05-13 01:00:12,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:12,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +16: [2023-05-13 01:00:12,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +16: [2023-05-13 01:00:12,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:12,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:12,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:12,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +16: [2023-05-13 01:00:12,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +11: [2023-05-13 01:00:12,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +11: [2023-05-13 01:00:12,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +11: [2023-05-13 01:00:12,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:12,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +11: [2023-05-13 01:00:12,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +11: [2023-05-13 01:00:12,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 9: [2023-05-13 01:00:12,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +12: [2023-05-13 01:00:12,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:12,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:12,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:12,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:12,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:12,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:12,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:12,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:12,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:12,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +12: [2023-05-13 01:00:12,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +24: [2023-05-13 01:00:12,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +24: [2023-05-13 01:00:12,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +24: [2023-05-13 01:00:12,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +24: [2023-05-13 01:00:12,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +24: [2023-05-13 01:00:12,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +24: [2023-05-13 01:00:12,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:12,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:12,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +12: [2023-05-13 01:00:12,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +12: [2023-05-13 01:00:12,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +12: [2023-05-13 01:00:12,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +24: [2023-05-13 01:00:12,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +12: [2023-05-13 01:00:12,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 9: [2023-05-13 01:00:12,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +16: [2023-05-13 01:00:12,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:12,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:12,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +11: [2023-05-13 01:00:12,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +11: [2023-05-13 01:00:12,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:12,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:12,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:12,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:12,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +30: [2023-05-13 01:00:12,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +30: [2023-05-13 01:00:12,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +30: [2023-05-13 01:00:12,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +30: [2023-05-13 01:00:12,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +30: [2023-05-13 01:00:12,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +30: [2023-05-13 01:00:12,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +30: [2023-05-13 01:00:12,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +24: [2023-05-13 01:00:12,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +30: [2023-05-13 01:00:12,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +30: [2023-05-13 01:00:12,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +30: [2023-05-13 01:00:12,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +12: [2023-05-13 01:00:12,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +16: [2023-05-13 01:00:12,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +30: [2023-05-13 01:00:12,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +30: [2023-05-13 01:00:12,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:12,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +16: [2023-05-13 01:00:12,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +30: [2023-05-13 01:00:12,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +30: [2023-05-13 01:00:12,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +30: [2023-05-13 01:00:12,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +30: [2023-05-13 01:00:12,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:12,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +16: [2023-05-13 01:00:12,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +16: [2023-05-13 01:00:12,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:12,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +24: [2023-05-13 01:00:12,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +26: [2023-05-13 01:00:12,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +26: [2023-05-13 01:00:12,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 5: [2023-05-13 01:00:12,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 5: [2023-05-13 01:00:12,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 3: [2023-05-13 01:00:12,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:12,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 8: [2023-05-13 01:00:12,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 8: [2023-05-13 01:00:12,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +26: [2023-05-13 01:00:12,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:12,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:12,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +26: [2023-05-13 01:00:12,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:12,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +20: [2023-05-13 01:00:12,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:12,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:12,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:12,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:12,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:12,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:12,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:12,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +26: [2023-05-13 01:00:12,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +26: [2023-05-13 01:00:12,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +26: [2023-05-13 01:00:12,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +26: [2023-05-13 01:00:12,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +26: [2023-05-13 01:00:12,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +16: [2023-05-13 01:00:12,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +24: [2023-05-13 01:00:12,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +24: [2023-05-13 01:00:12,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 1: [2023-05-13 01:00:12,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:12,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:13,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:13,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:13,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:13,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +20: [2023-05-13 01:00:13,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:13,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:13,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:13,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:13,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:13,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:13,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +26: [2023-05-13 01:00:13,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:13,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +26: [2023-05-13 01:00:13,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:13,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +20: [2023-05-13 01:00:13,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +20: [2023-05-13 01:00:13,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:13,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +24: [2023-05-13 01:00:13,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +24: [2023-05-13 01:00:13,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +24: [2023-05-13 01:00:13,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:13,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +24: [2023-05-13 01:00:13,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +18: [2023-05-13 01:00:13,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +18: [2023-05-13 01:00:13,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:13,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:13,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:13,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:13,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:13,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +18: [2023-05-13 01:00:13,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +18: [2023-05-13 01:00:13,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +18: [2023-05-13 01:00:13,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +18: [2023-05-13 01:00:13,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +30: [2023-05-13 01:00:13,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +18: [2023-05-13 01:00:13,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +30: [2023-05-13 01:00:13,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +18: [2023-05-13 01:00:13,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:13,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +18: [2023-05-13 01:00:13,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +24: [2023-05-13 01:00:13,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +16: [2023-05-13 01:00:13,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +18: [2023-05-13 01:00:13,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +24: [2023-05-13 01:00:13,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +12: [2023-05-13 01:00:13,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +30: [2023-05-13 01:00:13,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +24: [2023-05-13 01:00:13,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +24: [2023-05-13 01:00:13,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +24: [2023-05-13 01:00:13,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +30: [2023-05-13 01:00:13,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +30: [2023-05-13 01:00:13,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +24: [2023-05-13 01:00:13,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +12: [2023-05-13 01:00:13,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +20: [2023-05-13 01:00:13,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:13,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +12: [2023-05-13 01:00:13,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +13: [2023-05-13 01:00:13,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +13: [2023-05-13 01:00:13,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +30: [2023-05-13 01:00:13,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +13: [2023-05-13 01:00:13,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +13: [2023-05-13 01:00:13,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +13: [2023-05-13 01:00:13,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +13: [2023-05-13 01:00:13,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +13: [2023-05-13 01:00:13,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +12: [2023-05-13 01:00:13,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +12: [2023-05-13 01:00:13,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +19: [2023-05-13 01:00:13,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +19: [2023-05-13 01:00:13,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +19: [2023-05-13 01:00:13,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +26: [2023-05-13 01:00:13,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +19: [2023-05-13 01:00:13,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +19: [2023-05-13 01:00:13,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +19: [2023-05-13 01:00:13,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +13: [2023-05-13 01:00:13,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +19: [2023-05-13 01:00:13,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +13: [2023-05-13 01:00:13,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +30: [2023-05-13 01:00:13,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +13: [2023-05-13 01:00:13,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +28: [2023-05-13 01:00:13,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +28: [2023-05-13 01:00:13,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +28: [2023-05-13 01:00:13,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +28: [2023-05-13 01:00:13,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +28: [2023-05-13 01:00:13,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +28: [2023-05-13 01:00:13,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +28: [2023-05-13 01:00:13,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +28: [2023-05-13 01:00:13,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +30: [2023-05-13 01:00:13,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +30: [2023-05-13 01:00:13,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +28: [2023-05-13 01:00:13,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +13: [2023-05-13 01:00:13,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +30: [2023-05-13 01:00:13,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +28: [2023-05-13 01:00:13,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +12: [2023-05-13 01:00:13,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +28: [2023-05-13 01:00:13,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +13: [2023-05-13 01:00:13,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +28: [2023-05-13 01:00:13,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +28: [2023-05-13 01:00:13,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:13,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +28: [2023-05-13 01:00:13,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +28: [2023-05-13 01:00:13,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +28: [2023-05-13 01:00:13,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +26: [2023-05-13 01:00:13,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +19: [2023-05-13 01:00:13,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +19: [2023-05-13 01:00:13,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +19: [2023-05-13 01:00:13,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +19: [2023-05-13 01:00:13,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +19: [2023-05-13 01:00:13,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +19: [2023-05-13 01:00:13,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +19: [2023-05-13 01:00:13,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt... +30: [2023-05-13 01:00:13,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:13,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +20: [2023-05-13 01:00:13,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +18: [2023-05-13 01:00:13,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +18: [2023-05-13 01:00:13,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +30: [2023-05-13 01:00:13,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +30: [2023-05-13 01:00:13,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +26: [2023-05-13 01:00:13,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +26: [2023-05-13 01:00:13,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +26: [2023-05-13 01:00:13,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +26: [2023-05-13 01:00:13,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +30: [2023-05-13 01:00:13,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +30: [2023-05-13 01:00:13,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +30: [2023-05-13 01:00:13,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +26: [2023-05-13 01:00:13,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:13,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +18: [2023-05-13 01:00:13,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:13,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:13,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:13,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +26: [2023-05-13 01:00:13,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +18: [2023-05-13 01:00:13,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +18: [2023-05-13 01:00:13,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +18: [2023-05-13 01:00:13,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +18: [2023-05-13 01:00:13,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +18: [2023-05-13 01:00:13,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +18: [2023-05-13 01:00:13,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +26: [2023-05-13 01:00:13,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:13,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:13,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +19: [2023-05-13 01:00:13,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:13,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +13: [2023-05-13 01:00:13,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +13: [2023-05-13 01:00:13,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +28: [2023-05-13 01:00:13,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +26: [2023-05-13 01:00:13,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +28: [2023-05-13 01:00:13,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +13: [2023-05-13 01:00:13,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +13: [2023-05-13 01:00:13,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +13: [2023-05-13 01:00:13,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +20: [2023-05-13 01:00:13,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +26: [2023-05-13 01:00:13,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +28: [2023-05-13 01:00:13,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +28: [2023-05-13 01:00:13,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +26: [2023-05-13 01:00:13,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +26: [2023-05-13 01:00:13,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +26: [2023-05-13 01:00:13,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +28: [2023-05-13 01:00:13,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +28: [2023-05-13 01:00:13,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +13: [2023-05-13 01:00:13,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +13: [2023-05-13 01:00:13,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +19: [2023-05-13 01:00:13,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +20: [2023-05-13 01:00:13,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +20: [2023-05-13 01:00:13,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +20: [2023-05-13 01:00:13,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +20: [2023-05-13 01:00:13,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +20: [2023-05-13 01:00:13,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +28: [2023-05-13 01:00:13,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +28: [2023-05-13 01:00:13,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +28: [2023-05-13 01:00:13,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +19: [2023-05-13 01:00:13,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +19: [2023-05-13 01:00:13,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +19: [2023-05-13 01:00:13,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +19: [2023-05-13 01:00:13,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +28: [2023-05-13 01:00:13,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +28: [2023-05-13 01:00:13,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +28: [2023-05-13 01:00:13,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +19: [2023-05-13 01:00:13,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +28: [2023-05-13 01:00:13,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_24-model_00-model_states.pt. +13: [2023-05-13 01:00:13,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +28: [2023-05-13 01:00:13,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +28: [2023-05-13 01:00:13,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +28: [2023-05-13 01:00:13,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:13,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +21: [2023-05-13 01:00:13,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:13,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +21: [2023-05-13 01:00:13,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +21: [2023-05-13 01:00:13,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +21: [2023-05-13 01:00:13,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +21: [2023-05-13 01:00:13,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +21: [2023-05-13 01:00:13,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +21: [2023-05-13 01:00:13,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +21: [2023-05-13 01:00:13,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:13,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:13,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:13,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:13,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:13,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:13,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:13,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +15: [2023-05-13 01:00:13,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +15: [2023-05-13 01:00:13,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +15: [2023-05-13 01:00:13,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +15: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +15: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +15: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +15: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +15: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +15: [2023-05-13 01:00:13,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:13,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:13,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:13,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +15: [2023-05-13 01:00:13,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +15: [2023-05-13 01:00:13,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:13,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +15: [2023-05-13 01:00:13,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +15: [2023-05-13 01:00:13,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:13,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +15: [2023-05-13 01:00:13,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:13,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:13,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:13,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +15: [2023-05-13 01:00:13,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +15: [2023-05-13 01:00:13,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:13,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +21: [2023-05-13 01:00:13,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +21: [2023-05-13 01:00:13,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +21: [2023-05-13 01:00:13,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +21: [2023-05-13 01:00:13,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +21: [2023-05-13 01:00:13,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +21: [2023-05-13 01:00:13,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +15: [2023-05-13 01:00:13,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +21: [2023-05-13 01:00:13,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +21: [2023-05-13 01:00:13,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +27: [2023-05-13 01:00:13,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:13,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +27: [2023-05-13 01:00:13,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:13,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +27: [2023-05-13 01:00:13,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:13,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +27: [2023-05-13 01:00:13,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +27: [2023-05-13 01:00:13,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:13,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +21: [2023-05-13 01:00:13,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +27: [2023-05-13 01:00:13,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +27: [2023-05-13 01:00:13,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +27: [2023-05-13 01:00:13,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +15: [2023-05-13 01:00:13,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +15: [2023-05-13 01:00:13,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +15: [2023-05-13 01:00:13,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +21: [2023-05-13 01:00:13,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +15: [2023-05-13 01:00:13,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +29: [2023-05-13 01:00:13,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +29: [2023-05-13 01:00:13,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +29: [2023-05-13 01:00:13,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +29: [2023-05-13 01:00:13,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +29: [2023-05-13 01:00:13,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +29: [2023-05-13 01:00:13,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +29: [2023-05-13 01:00:13,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +29: [2023-05-13 01:00:13,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +29: [2023-05-13 01:00:13,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:13,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +15: [2023-05-13 01:00:13,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +15: [2023-05-13 01:00:13,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +15: [2023-05-13 01:00:13,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +29: [2023-05-13 01:00:13,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:13,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:13,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:13,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:13,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +29: [2023-05-13 01:00:13,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:13,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +15: [2023-05-13 01:00:13,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +15: [2023-05-13 01:00:13,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +14: [2023-05-13 01:00:13,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +11: [2023-05-13 01:00:13,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +11: [2023-05-13 01:00:13,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +11: [2023-05-13 01:00:13,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +11: [2023-05-13 01:00:13,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +11: [2023-05-13 01:00:13,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +11: [2023-05-13 01:00:13,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +11: [2023-05-13 01:00:13,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +11: [2023-05-13 01:00:13,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +27: [2023-05-13 01:00:13,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +14: [2023-05-13 01:00:13,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +11: [2023-05-13 01:00:13,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:13,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:13,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:13,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +14: [2023-05-13 01:00:13,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +14: [2023-05-13 01:00:13,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +14: [2023-05-13 01:00:13,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +11: [2023-05-13 01:00:13,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:13,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:13,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +11: [2023-05-13 01:00:13,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:13,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +15: [2023-05-13 01:00:13,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +14: [2023-05-13 01:00:13,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +15: [2023-05-13 01:00:13,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +15: [2023-05-13 01:00:13,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +15: [2023-05-13 01:00:13,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +27: [2023-05-13 01:00:13,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +15: [2023-05-13 01:00:13,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +27: [2023-05-13 01:00:13,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +25: [2023-05-13 01:00:13,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +25: [2023-05-13 01:00:13,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +25: [2023-05-13 01:00:13,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +25: [2023-05-13 01:00:13,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +25: [2023-05-13 01:00:13,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +25: [2023-05-13 01:00:13,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +25: [2023-05-13 01:00:13,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +25: [2023-05-13 01:00:13,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +25: [2023-05-13 01:00:13,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +25: [2023-05-13 01:00:13,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +27: [2023-05-13 01:00:13,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +27: [2023-05-13 01:00:13,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +25: [2023-05-13 01:00:13,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +25: [2023-05-13 01:00:13,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +25: [2023-05-13 01:00:13,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +25: [2023-05-13 01:00:13,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +27: [2023-05-13 01:00:13,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +25: [2023-05-13 01:00:13,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +25: [2023-05-13 01:00:13,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:13,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +15: [2023-05-13 01:00:13,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +27: [2023-05-13 01:00:13,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +27: [2023-05-13 01:00:13,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +29: [2023-05-13 01:00:13,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +29: [2023-05-13 01:00:13,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +29: [2023-05-13 01:00:13,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +11: [2023-05-13 01:00:13,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +11: [2023-05-13 01:00:13,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +29: [2023-05-13 01:00:13,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +29: [2023-05-13 01:00:13,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +11: [2023-05-13 01:00:13,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +29: [2023-05-13 01:00:13,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +29: [2023-05-13 01:00:13,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +29: [2023-05-13 01:00:13,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +11: [2023-05-13 01:00:13,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +23: [2023-05-13 01:00:13,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +23: [2023-05-13 01:00:13,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +11: [2023-05-13 01:00:13,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +11: [2023-05-13 01:00:13,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +11: [2023-05-13 01:00:13,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +17: [2023-05-13 01:00:13,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +17: [2023-05-13 01:00:13,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +23: [2023-05-13 01:00:13,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +23: [2023-05-13 01:00:13,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +23: [2023-05-13 01:00:13,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +23: [2023-05-13 01:00:13,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +23: [2023-05-13 01:00:13,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +23: [2023-05-13 01:00:13,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +23: [2023-05-13 01:00:13,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +23: [2023-05-13 01:00:13,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +23: [2023-05-13 01:00:13,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:13,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +17: [2023-05-13 01:00:13,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +17: [2023-05-13 01:00:13,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +17: [2023-05-13 01:00:13,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +17: [2023-05-13 01:00:13,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +17: [2023-05-13 01:00:13,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +17: [2023-05-13 01:00:13,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:13,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +23: [2023-05-13 01:00:13,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +23: [2023-05-13 01:00:13,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +23: [2023-05-13 01:00:13,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +25: [2023-05-13 01:00:13,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +25: [2023-05-13 01:00:13,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:13,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:13,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:13,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +17: [2023-05-13 01:00:13,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +23: [2023-05-13 01:00:13,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +23: [2023-05-13 01:00:13,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +29: [2023-05-13 01:00:13,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +11: [2023-05-13 01:00:13,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +29: [2023-05-13 01:00:13,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +17: [2023-05-13 01:00:13,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:13,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:13,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:13,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +29: [2023-05-13 01:00:13,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +17: [2023-05-13 01:00:13,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:13,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +11: [2023-05-13 01:00:13,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +29: [2023-05-13 01:00:13,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +29: [2023-05-13 01:00:13,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +11: [2023-05-13 01:00:13,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +25: [2023-05-13 01:00:13,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +11: [2023-05-13 01:00:13,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +25: [2023-05-13 01:00:13,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +11: [2023-05-13 01:00:13,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +11: [2023-05-13 01:00:13,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +25: [2023-05-13 01:00:13,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +25: [2023-05-13 01:00:13,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +25: [2023-05-13 01:00:13,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +25: [2023-05-13 01:00:13,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +25: [2023-05-13 01:00:13,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +23: [2023-05-13 01:00:13,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +11: [2023-05-13 01:00:13,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +17: [2023-05-13 01:00:13,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +23: [2023-05-13 01:00:13,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +23: [2023-05-13 01:00:13,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +17: [2023-05-13 01:00:13,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +17: [2023-05-13 01:00:13,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +25: [2023-05-13 01:00:13,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +25: [2023-05-13 01:00:13,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +23: [2023-05-13 01:00:13,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +25: [2023-05-13 01:00:13,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +25: [2023-05-13 01:00:13,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +25: [2023-05-13 01:00:13,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +25: [2023-05-13 01:00:13,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +17: [2023-05-13 01:00:13,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +17: [2023-05-13 01:00:13,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +23: [2023-05-13 01:00:13,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +23: [2023-05-13 01:00:13,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +17: [2023-05-13 01:00:13,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +17: [2023-05-13 01:00:13,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +23: [2023-05-13 01:00:13,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +23: [2023-05-13 01:00:13,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +12: [2023-05-13 01:00:13,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +12: [2023-05-13 01:00:13,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +12: [2023-05-13 01:00:13,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +12: [2023-05-13 01:00:13,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +12: [2023-05-13 01:00:13,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +12: [2023-05-13 01:00:13,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +12: [2023-05-13 01:00:13,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +12: [2023-05-13 01:00:13,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +12: [2023-05-13 01:00:13,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +12: [2023-05-13 01:00:13,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +25: [2023-05-13 01:00:13,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +12: [2023-05-13 01:00:13,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +12: [2023-05-13 01:00:13,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +12: [2023-05-13 01:00:13,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +23: [2023-05-13 01:00:13,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +12: [2023-05-13 01:00:13,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +12: [2023-05-13 01:00:13,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +12: [2023-05-13 01:00:13,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +17: [2023-05-13 01:00:13,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +17: [2023-05-13 01:00:13,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +17: [2023-05-13 01:00:13,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +17: [2023-05-13 01:00:13,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +17: [2023-05-13 01:00:13,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +23: [2023-05-13 01:00:13,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +23: [2023-05-13 01:00:13,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +23: [2023-05-13 01:00:13,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +23: [2023-05-13 01:00:13,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +17: [2023-05-13 01:00:13,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +23: [2023-05-13 01:00:13,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +17: [2023-05-13 01:00:13,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +17: [2023-05-13 01:00:13,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +17: [2023-05-13 01:00:13,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +19: [2023-05-13 01:00:13,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +19: [2023-05-13 01:00:13,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +19: [2023-05-13 01:00:13,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +19: [2023-05-13 01:00:13,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +19: [2023-05-13 01:00:13,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +19: [2023-05-13 01:00:13,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +19: [2023-05-13 01:00:13,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +12: [2023-05-13 01:00:13,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +19: [2023-05-13 01:00:13,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +23: [2023-05-13 01:00:13,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +19: [2023-05-13 01:00:13,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +22: [2023-05-13 01:00:13,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +22: [2023-05-13 01:00:13,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +22: [2023-05-13 01:00:13,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +22: [2023-05-13 01:00:13,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +22: [2023-05-13 01:00:13,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +22: [2023-05-13 01:00:13,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +22: [2023-05-13 01:00:13,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +22: [2023-05-13 01:00:13,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +19: [2023-05-13 01:00:13,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +22: [2023-05-13 01:00:13,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +22: [2023-05-13 01:00:13,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +22: [2023-05-13 01:00:13,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +22: [2023-05-13 01:00:13,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +22: [2023-05-13 01:00:13,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +13: [2023-05-13 01:00:13,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +13: [2023-05-13 01:00:13,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +22: [2023-05-13 01:00:13,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +22: [2023-05-13 01:00:13,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +23: [2023-05-13 01:00:13,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +13: [2023-05-13 01:00:13,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +13: [2023-05-13 01:00:13,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +13: [2023-05-13 01:00:13,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +13: [2023-05-13 01:00:13,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +13: [2023-05-13 01:00:13,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +22: [2023-05-13 01:00:13,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +12: [2023-05-13 01:00:13,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +13: [2023-05-13 01:00:13,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +12: [2023-05-13 01:00:13,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +12: [2023-05-13 01:00:13,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +12: [2023-05-13 01:00:13,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +22: [2023-05-13 01:00:13,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +19: [2023-05-13 01:00:13,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +12: [2023-05-13 01:00:13,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +12: [2023-05-13 01:00:13,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +12: [2023-05-13 01:00:13,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +12: [2023-05-13 01:00:13,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +12: [2023-05-13 01:00:13,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +12: [2023-05-13 01:00:13,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +13: [2023-05-13 01:00:13,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +31: [2023-05-13 01:00:13,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +31: [2023-05-13 01:00:13,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +16: [2023-05-13 01:00:13,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +16: [2023-05-13 01:00:13,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +16: [2023-05-13 01:00:13,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +16: [2023-05-13 01:00:13,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +16: [2023-05-13 01:00:13,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +16: [2023-05-13 01:00:13,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +16: [2023-05-13 01:00:13,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +18: [2023-05-13 01:00:13,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +18: [2023-05-13 01:00:13,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +16: [2023-05-13 01:00:13,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +31: [2023-05-13 01:00:13,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +31: [2023-05-13 01:00:13,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +18: [2023-05-13 01:00:13,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +31: [2023-05-13 01:00:13,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +31: [2023-05-13 01:00:13,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +31: [2023-05-13 01:00:13,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +31: [2023-05-13 01:00:13,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +18: [2023-05-13 01:00:13,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +18: [2023-05-13 01:00:13,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +18: [2023-05-13 01:00:13,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +18: [2023-05-13 01:00:13,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +18: [2023-05-13 01:00:13,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +18: [2023-05-13 01:00:13,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +16: [2023-05-13 01:00:13,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:13,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +16: [2023-05-13 01:00:13,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:13,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +22: [2023-05-13 01:00:13,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +22: [2023-05-13 01:00:13,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +31: [2023-05-13 01:00:13,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:13,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:13,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:13,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:13,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +18: [2023-05-13 01:00:13,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:13,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +16: [2023-05-13 01:00:13,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +16: [2023-05-13 01:00:13,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +22: [2023-05-13 01:00:13,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +16: [2023-05-13 01:00:13,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +16: [2023-05-13 01:00:13,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +16: [2023-05-13 01:00:13,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +16: [2023-05-13 01:00:13,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +13: [2023-05-13 01:00:13,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +19: [2023-05-13 01:00:13,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +19: [2023-05-13 01:00:13,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +22: [2023-05-13 01:00:13,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +12: [2023-05-13 01:00:13,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +13: [2023-05-13 01:00:13,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +22: [2023-05-13 01:00:13,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +22: [2023-05-13 01:00:13,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +22: [2023-05-13 01:00:13,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +13: [2023-05-13 01:00:13,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +13: [2023-05-13 01:00:13,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +13: [2023-05-13 01:00:13,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +12: [2023-05-13 01:00:13,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +12: [2023-05-13 01:00:13,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +13: [2023-05-13 01:00:13,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +13: [2023-05-13 01:00:13,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +12: [2023-05-13 01:00:13,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +12: [2023-05-13 01:00:13,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +22: [2023-05-13 01:00:13,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +19: [2023-05-13 01:00:13,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +22: [2023-05-13 01:00:13,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +22: [2023-05-13 01:00:13,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +13: [2023-05-13 01:00:13,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +13: [2023-05-13 01:00:13,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +22: [2023-05-13 01:00:13,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +19: [2023-05-13 01:00:13,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +18: [2023-05-13 01:00:13,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +13: [2023-05-13 01:00:13,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +22: [2023-05-13 01:00:13,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +19: [2023-05-13 01:00:13,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +16: [2023-05-13 01:00:13,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +22: [2023-05-13 01:00:13,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +22: [2023-05-13 01:00:13,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +13: [2023-05-13 01:00:13,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +13: [2023-05-13 01:00:13,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +22: [2023-05-13 01:00:13,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +13: [2023-05-13 01:00:13,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +13: [2023-05-13 01:00:13,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:13,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +31: [2023-05-13 01:00:13,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +18: [2023-05-13 01:00:13,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +19: [2023-05-13 01:00:13,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +31: [2023-05-13 01:00:13,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +31: [2023-05-13 01:00:13,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +31: [2023-05-13 01:00:13,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +31: [2023-05-13 01:00:13,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +31: [2023-05-13 01:00:13,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +31: [2023-05-13 01:00:13,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +16: [2023-05-13 01:00:13,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +16: [2023-05-13 01:00:13,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +18: [2023-05-13 01:00:13,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +18: [2023-05-13 01:00:13,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +18: [2023-05-13 01:00:13,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +18: [2023-05-13 01:00:13,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +18: [2023-05-13 01:00:13,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +18: [2023-05-13 01:00:13,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +19: [2023-05-13 01:00:13,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +30: [2023-05-13 01:00:13,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +30: [2023-05-13 01:00:13,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +19: [2023-05-13 01:00:13,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +30: [2023-05-13 01:00:13,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +30: [2023-05-13 01:00:13,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +30: [2023-05-13 01:00:13,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +30: [2023-05-13 01:00:13,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +30: [2023-05-13 01:00:13,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +30: [2023-05-13 01:00:13,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +30: [2023-05-13 01:00:13,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +30: [2023-05-13 01:00:13,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +30: [2023-05-13 01:00:13,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +30: [2023-05-13 01:00:13,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +18: [2023-05-13 01:00:13,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +19: [2023-05-13 01:00:13,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +10: [2023-05-13 01:00:13,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +10: [2023-05-13 01:00:13,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +10: [2023-05-13 01:00:13,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +10: [2023-05-13 01:00:13,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +10: [2023-05-13 01:00:13,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +30: [2023-05-13 01:00:13,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +30: [2023-05-13 01:00:13,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +10: [2023-05-13 01:00:13,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +10: [2023-05-13 01:00:13,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +10: [2023-05-13 01:00:13,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +30: [2023-05-13 01:00:13,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:13,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +30: [2023-05-13 01:00:13,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +10: [2023-05-13 01:00:13,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +10: [2023-05-13 01:00:13,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +10: [2023-05-13 01:00:13,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +16: [2023-05-13 01:00:13,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +16: [2023-05-13 01:00:13,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +16: [2023-05-13 01:00:13,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +31: [2023-05-13 01:00:13,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +10: [2023-05-13 01:00:13,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +31: [2023-05-13 01:00:13,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +10: [2023-05-13 01:00:13,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +10: [2023-05-13 01:00:13,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +31: [2023-05-13 01:00:13,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +16: [2023-05-13 01:00:13,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +16: [2023-05-13 01:00:13,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +16: [2023-05-13 01:00:13,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +21: [2023-05-13 01:00:13,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +21: [2023-05-13 01:00:13,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +31: [2023-05-13 01:00:13,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +31: [2023-05-13 01:00:13,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +21: [2023-05-13 01:00:13,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +31: [2023-05-13 01:00:13,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +21: [2023-05-13 01:00:13,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +21: [2023-05-13 01:00:13,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +21: [2023-05-13 01:00:13,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +21: [2023-05-13 01:00:13,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +21: [2023-05-13 01:00:13,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +21: [2023-05-13 01:00:13,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +31: [2023-05-13 01:00:13,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +21: [2023-05-13 01:00:13,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +16: [2023-05-13 01:00:13,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +21: [2023-05-13 01:00:13,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +21: [2023-05-13 01:00:13,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +21: [2023-05-13 01:00:13,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +21: [2023-05-13 01:00:13,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +18: [2023-05-13 01:00:13,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +21: [2023-05-13 01:00:13,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +18: [2023-05-13 01:00:13,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +21: [2023-05-13 01:00:13,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +18: [2023-05-13 01:00:13,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +18: [2023-05-13 01:00:13,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +18: [2023-05-13 01:00:13,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +20: [2023-05-13 01:00:13,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +20: [2023-05-13 01:00:13,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +20: [2023-05-13 01:00:13,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +20: [2023-05-13 01:00:13,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +20: [2023-05-13 01:00:13,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +20: [2023-05-13 01:00:13,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +20: [2023-05-13 01:00:13,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +20: [2023-05-13 01:00:13,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +20: [2023-05-13 01:00:13,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +20: [2023-05-13 01:00:13,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +20: [2023-05-13 01:00:13,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +27: [2023-05-13 01:00:13,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +27: [2023-05-13 01:00:13,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +27: [2023-05-13 01:00:13,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +27: [2023-05-13 01:00:13,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +27: [2023-05-13 01:00:13,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +27: [2023-05-13 01:00:13,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +20: [2023-05-13 01:00:13,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +27: [2023-05-13 01:00:13,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +24: [2023-05-13 01:00:13,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +24: [2023-05-13 01:00:13,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +24: [2023-05-13 01:00:13,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +24: [2023-05-13 01:00:13,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +24: [2023-05-13 01:00:13,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +24: [2023-05-13 01:00:13,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +24: [2023-05-13 01:00:13,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +24: [2023-05-13 01:00:13,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +20: [2023-05-13 01:00:13,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +27: [2023-05-13 01:00:13,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +26: [2023-05-13 01:00:13,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +26: [2023-05-13 01:00:13,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +27: [2023-05-13 01:00:13,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +26: [2023-05-13 01:00:13,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +20: [2023-05-13 01:00:13,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +27: [2023-05-13 01:00:13,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +14: [2023-05-13 01:00:13,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +14: [2023-05-13 01:00:13,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +27: [2023-05-13 01:00:13,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +20: [2023-05-13 01:00:13,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +27: [2023-05-13 01:00:13,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +24: [2023-05-13 01:00:13,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +24: [2023-05-13 01:00:13,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +24: [2023-05-13 01:00:13,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +24: [2023-05-13 01:00:13,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +24: [2023-05-13 01:00:13,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +20: [2023-05-13 01:00:13,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +26: [2023-05-13 01:00:13,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +26: [2023-05-13 01:00:13,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +26: [2023-05-13 01:00:13,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +26: [2023-05-13 01:00:13,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +26: [2023-05-13 01:00:13,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +26: [2023-05-13 01:00:13,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +14: [2023-05-13 01:00:13,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +14: [2023-05-13 01:00:13,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +14: [2023-05-13 01:00:13,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +14: [2023-05-13 01:00:13,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +14: [2023-05-13 01:00:13,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +14: [2023-05-13 01:00:13,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +27: [2023-05-13 01:00:13,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +24: [2023-05-13 01:00:13,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +24: [2023-05-13 01:00:13,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +24: [2023-05-13 01:00:13,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +26: [2023-05-13 01:00:13,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +16: [2023-05-13 01:00:13,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +30: [2023-05-13 01:00:13,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +16: [2023-05-13 01:00:13,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +16: [2023-05-13 01:00:13,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +14: [2023-05-13 01:00:13,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +26: [2023-05-13 01:00:13,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:13,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +26: [2023-05-13 01:00:13,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +30: [2023-05-13 01:00:13,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +26: [2023-05-13 01:00:13,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:13,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:13,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +14: [2023-05-13 01:00:13,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +26: [2023-05-13 01:00:13,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +14: [2023-05-13 01:00:13,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +26: [2023-05-13 01:00:13,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +16: [2023-05-13 01:00:13,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +26: [2023-05-13 01:00:13,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +16: [2023-05-13 01:00:13,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +16: [2023-05-13 01:00:13,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +30: [2023-05-13 01:00:13,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +10: [2023-05-13 01:00:13,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +30: [2023-05-13 01:00:13,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +21: [2023-05-13 01:00:13,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +11: [2023-05-13 01:00:13,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +11: [2023-05-13 01:00:13,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +30: [2023-05-13 01:00:13,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +21: [2023-05-13 01:00:13,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +21: [2023-05-13 01:00:13,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +10: [2023-05-13 01:00:13,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +30: [2023-05-13 01:00:13,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +10: [2023-05-13 01:00:13,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +11: [2023-05-13 01:00:13,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +28: [2023-05-13 01:00:13,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +28: [2023-05-13 01:00:13,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +28: [2023-05-13 01:00:13,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +28: [2023-05-13 01:00:13,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +28: [2023-05-13 01:00:13,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +28: [2023-05-13 01:00:13,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +28: [2023-05-13 01:00:13,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +28: [2023-05-13 01:00:13,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +11: [2023-05-13 01:00:13,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +11: [2023-05-13 01:00:13,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +11: [2023-05-13 01:00:13,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +11: [2023-05-13 01:00:13,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +11: [2023-05-13 01:00:13,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +11: [2023-05-13 01:00:13,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +10: [2023-05-13 01:00:13,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +10: [2023-05-13 01:00:13,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +28: [2023-05-13 01:00:13,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +21: [2023-05-13 01:00:13,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +21: [2023-05-13 01:00:13,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +28: [2023-05-13 01:00:13,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:13,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +28: [2023-05-13 01:00:13,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +28: [2023-05-13 01:00:13,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:13,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +28: [2023-05-13 01:00:13,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +28: [2023-05-13 01:00:13,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +11: [2023-05-13 01:00:13,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +11: [2023-05-13 01:00:13,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +20: [2023-05-13 01:00:13,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +11: [2023-05-13 01:00:13,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +28: [2023-05-13 01:00:13,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... +28: [2023-05-13 01:00:13,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +11: [2023-05-13 01:00:13,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +11: [2023-05-13 01:00:13,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +21: [2023-05-13 01:00:13,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +21: [2023-05-13 01:00:13,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +30: [2023-05-13 01:00:13,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +30: [2023-05-13 01:00:13,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +30: [2023-05-13 01:00:13,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +30: [2023-05-13 01:00:13,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +10: [2023-05-13 01:00:13,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +27: [2023-05-13 01:00:13,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +21: [2023-05-13 01:00:13,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:13,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +25: [2023-05-13 01:00:13,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +25: [2023-05-13 01:00:13,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +25: [2023-05-13 01:00:13,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +10: [2023-05-13 01:00:13,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +24: [2023-05-13 01:00:13,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +25: [2023-05-13 01:00:13,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +25: [2023-05-13 01:00:13,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +25: [2023-05-13 01:00:13,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +25: [2023-05-13 01:00:13,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +25: [2023-05-13 01:00:13,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +25: [2023-05-13 01:00:13,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +25: [2023-05-13 01:00:13,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +26: [2023-05-13 01:00:13,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +26: [2023-05-13 01:00:13,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +10: [2023-05-13 01:00:13,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +21: [2023-05-13 01:00:13,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +27: [2023-05-13 01:00:13,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +27: [2023-05-13 01:00:13,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +25: [2023-05-13 01:00:13,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +20: [2023-05-13 01:00:13,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +20: [2023-05-13 01:00:13,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +21: [2023-05-13 01:00:13,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +21: [2023-05-13 01:00:13,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +25: [2023-05-13 01:00:13,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +25: [2023-05-13 01:00:13,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +25: [2023-05-13 01:00:13,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +25: [2023-05-13 01:00:13,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +25: [2023-05-13 01:00:13,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +21: [2023-05-13 01:00:13,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +21: [2023-05-13 01:00:13,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:13,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +27: [2023-05-13 01:00:13,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +20: [2023-05-13 01:00:13,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +27: [2023-05-13 01:00:13,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +11: [2023-05-13 01:00:13,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +24: [2023-05-13 01:00:13,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +14: [2023-05-13 01:00:13,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +14: [2023-05-13 01:00:13,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +21: [2023-05-13 01:00:13,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +14: [2023-05-13 01:00:13,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +24: [2023-05-13 01:00:13,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +24: [2023-05-13 01:00:13,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +21: [2023-05-13 01:00:13,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +30: [2023-05-13 01:00:13,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +14: [2023-05-13 01:00:13,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +24: [2023-05-13 01:00:13,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +26: [2023-05-13 01:00:13,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +14: [2023-05-13 01:00:13,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +26: [2023-05-13 01:00:13,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +27: [2023-05-13 01:00:13,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:13,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +26: [2023-05-13 01:00:13,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +30: [2023-05-13 01:00:13,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +21: [2023-05-13 01:00:13,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +27: [2023-05-13 01:00:13,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +27: [2023-05-13 01:00:13,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:13,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +26: [2023-05-13 01:00:13,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +27: [2023-05-13 01:00:13,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +27: [2023-05-13 01:00:13,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:13,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +27: [2023-05-13 01:00:13,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:13,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +24: [2023-05-13 01:00:13,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +24: [2023-05-13 01:00:13,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:13,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +14: [2023-05-13 01:00:13,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +11: [2023-05-13 01:00:13,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 7: [2023-05-13 01:00:13,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +27: [2023-05-13 01:00:13,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +27: [2023-05-13 01:00:13,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +20: [2023-05-13 01:00:13,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +28: [2023-05-13 01:00:13,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +28: [2023-05-13 01:00:13,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +28: [2023-05-13 01:00:13,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +28: [2023-05-13 01:00:13,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +20: [2023-05-13 01:00:13,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +20: [2023-05-13 01:00:13,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +20: [2023-05-13 01:00:13,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +20: [2023-05-13 01:00:13,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 7: [2023-05-13 01:00:13,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +28: [2023-05-13 01:00:13,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +11: [2023-05-13 01:00:13,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +28: [2023-05-13 01:00:13,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +28: [2023-05-13 01:00:13,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +24: [2023-05-13 01:00:13,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +26: [2023-05-13 01:00:13,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +28: [2023-05-13 01:00:13,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +14: [2023-05-13 01:00:13,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +14: [2023-05-13 01:00:13,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +14: [2023-05-13 01:00:13,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +14: [2023-05-13 01:00:13,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:13,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +26: [2023-05-13 01:00:13,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +24: [2023-05-13 01:00:13,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +11: [2023-05-13 01:00:13,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +11: [2023-05-13 01:00:13,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +25: [2023-05-13 01:00:13,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. +11: [2023-05-13 01:00:13,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +27: [2023-05-13 01:00:13,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +14: [2023-05-13 01:00:13,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +26: [2023-05-13 01:00:13,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +14: [2023-05-13 01:00:13,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +25: [2023-05-13 01:00:13,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +11: [2023-05-13 01:00:13,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +11: [2023-05-13 01:00:13,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +20: [2023-05-13 01:00:13,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +26: [2023-05-13 01:00:13,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +11: [2023-05-13 01:00:13,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +17: [2023-05-13 01:00:13,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +17: [2023-05-13 01:00:13,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +17: [2023-05-13 01:00:13,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +17: [2023-05-13 01:00:13,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +17: [2023-05-13 01:00:13,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +17: [2023-05-13 01:00:13,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +17: [2023-05-13 01:00:13,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +17: [2023-05-13 01:00:13,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +24: [2023-05-13 01:00:13,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +26: [2023-05-13 01:00:13,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_25-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +17: [2023-05-13 01:00:13,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +17: [2023-05-13 01:00:13,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +24: [2023-05-13 01:00:13,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +17: [2023-05-13 01:00:13,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +24: [2023-05-13 01:00:13,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +15: [2023-05-13 01:00:13,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +15: [2023-05-13 01:00:13,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +15: [2023-05-13 01:00:13,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +15: [2023-05-13 01:00:13,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +15: [2023-05-13 01:00:13,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +15: [2023-05-13 01:00:13,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +15: [2023-05-13 01:00:13,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +17: [2023-05-13 01:00:13,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +15: [2023-05-13 01:00:13,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +17: [2023-05-13 01:00:13,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +17: [2023-05-13 01:00:13,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +17: [2023-05-13 01:00:13,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +15: [2023-05-13 01:00:13,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +15: [2023-05-13 01:00:13,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +15: [2023-05-13 01:00:13,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +15: [2023-05-13 01:00:13,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +25: [2023-05-13 01:00:13,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +17: [2023-05-13 01:00:13,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +15: [2023-05-13 01:00:13,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +29: [2023-05-13 01:00:13,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +29: [2023-05-13 01:00:13,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +29: [2023-05-13 01:00:13,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +29: [2023-05-13 01:00:13,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +29: [2023-05-13 01:00:13,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +29: [2023-05-13 01:00:13,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +29: [2023-05-13 01:00:13,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +15: [2023-05-13 01:00:13,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +29: [2023-05-13 01:00:13,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +15: [2023-05-13 01:00:13,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +25: [2023-05-13 01:00:13,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +15: [2023-05-13 01:00:13,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +28: [2023-05-13 01:00:13,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +25: [2023-05-13 01:00:13,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +29: [2023-05-13 01:00:13,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +29: [2023-05-13 01:00:13,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +28: [2023-05-13 01:00:13,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +29: [2023-05-13 01:00:13,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +26: [2023-05-13 01:00:13,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +11: [2023-05-13 01:00:13,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +26: [2023-05-13 01:00:13,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +29: [2023-05-13 01:00:13,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +29: [2023-05-13 01:00:13,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +29: [2023-05-13 01:00:13,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +29: [2023-05-13 01:00:13,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +29: [2023-05-13 01:00:13,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +28: [2023-05-13 01:00:13,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +20: [2023-05-13 01:00:13,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +11: [2023-05-13 01:00:13,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +11: [2023-05-13 01:00:13,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +28: [2023-05-13 01:00:13,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +20: [2023-05-13 01:00:13,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +28: [2023-05-13 01:00:13,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +20: [2023-05-13 01:00:13,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +20: [2023-05-13 01:00:13,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +28: [2023-05-13 01:00:13,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +28: [2023-05-13 01:00:13,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +28: [2023-05-13 01:00:13,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +11: [2023-05-13 01:00:13,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +11: [2023-05-13 01:00:13,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +11: [2023-05-13 01:00:13,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +25: [2023-05-13 01:00:13,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +25: [2023-05-13 01:00:13,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +25: [2023-05-13 01:00:13,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +25: [2023-05-13 01:00:13,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +25: [2023-05-13 01:00:13,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +26: [2023-05-13 01:00:13,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +23: [2023-05-13 01:00:13,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +23: [2023-05-13 01:00:13,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +23: [2023-05-13 01:00:13,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +25: [2023-05-13 01:00:13,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +23: [2023-05-13 01:00:13,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +23: [2023-05-13 01:00:13,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +23: [2023-05-13 01:00:13,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +23: [2023-05-13 01:00:13,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +23: [2023-05-13 01:00:13,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +23: [2023-05-13 01:00:13,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +23: [2023-05-13 01:00:13,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +23: [2023-05-13 01:00:13,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +23: [2023-05-13 01:00:13,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +23: [2023-05-13 01:00:13,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +23: [2023-05-13 01:00:13,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +11: [2023-05-13 01:00:13,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +23: [2023-05-13 01:00:13,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +23: [2023-05-13 01:00:13,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +17: [2023-05-13 01:00:13,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +17: [2023-05-13 01:00:13,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +25: [2023-05-13 01:00:13,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +25: [2023-05-13 01:00:13,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +25: [2023-05-13 01:00:13,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +25: [2023-05-13 01:00:13,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +29: [2023-05-13 01:00:13,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +15: [2023-05-13 01:00:13,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +15: [2023-05-13 01:00:13,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +15: [2023-05-13 01:00:13,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +15: [2023-05-13 01:00:13,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +29: [2023-05-13 01:00:13,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +25: [2023-05-13 01:00:13,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +17: [2023-05-13 01:00:13,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +29: [2023-05-13 01:00:13,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +17: [2023-05-13 01:00:13,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +17: [2023-05-13 01:00:13,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +15: [2023-05-13 01:00:13,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +15: [2023-05-13 01:00:13,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +17: [2023-05-13 01:00:13,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +15: [2023-05-13 01:00:13,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +15: [2023-05-13 01:00:13,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +29: [2023-05-13 01:00:13,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +29: [2023-05-13 01:00:13,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 9: [2023-05-13 01:00:13,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +23: [2023-05-13 01:00:13,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +23: [2023-05-13 01:00:13,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +29: [2023-05-13 01:00:13,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +29: [2023-05-13 01:00:13,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +29: [2023-05-13 01:00:13,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:13,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +22: [2023-05-13 01:00:13,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +15: [2023-05-13 01:00:13,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:13,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +15: [2023-05-13 01:00:13,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:13,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +22: [2023-05-13 01:00:13,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +22: [2023-05-13 01:00:13,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +22: [2023-05-13 01:00:13,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +22: [2023-05-13 01:00:13,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +15: [2023-05-13 01:00:13,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +17: [2023-05-13 01:00:13,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +17: [2023-05-13 01:00:13,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +17: [2023-05-13 01:00:13,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +17: [2023-05-13 01:00:13,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +22: [2023-05-13 01:00:13,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +15: [2023-05-13 01:00:13,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +29: [2023-05-13 01:00:13,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:13,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:13,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +12: [2023-05-13 01:00:13,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +22: [2023-05-13 01:00:13,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:13,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +12: [2023-05-13 01:00:13,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +12: [2023-05-13 01:00:13,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +12: [2023-05-13 01:00:13,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +12: [2023-05-13 01:00:13,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +12: [2023-05-13 01:00:13,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +12: [2023-05-13 01:00:13,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +12: [2023-05-13 01:00:13,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +22: [2023-05-13 01:00:13,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +22: [2023-05-13 01:00:13,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +12: [2023-05-13 01:00:13,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +29: [2023-05-13 01:00:13,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 2: [2023-05-13 01:00:13,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +17: [2023-05-13 01:00:13,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:13,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +22: [2023-05-13 01:00:13,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +15: [2023-05-13 01:00:13,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +29: [2023-05-13 01:00:13,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 2: [2023-05-13 01:00:13,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +12: [2023-05-13 01:00:13,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +12: [2023-05-13 01:00:13,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +12: [2023-05-13 01:00:13,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +17: [2023-05-13 01:00:13,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +15: [2023-05-13 01:00:13,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +23: [2023-05-13 01:00:13,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +12: [2023-05-13 01:00:13,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +23: [2023-05-13 01:00:13,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +19: [2023-05-13 01:00:13,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +19: [2023-05-13 01:00:13,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +19: [2023-05-13 01:00:13,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +19: [2023-05-13 01:00:13,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +12: [2023-05-13 01:00:13,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +23: [2023-05-13 01:00:13,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 6: [2023-05-13 01:00:13,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +23: [2023-05-13 01:00:13,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +12: [2023-05-13 01:00:13,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +15: [2023-05-13 01:00:13,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +12: [2023-05-13 01:00:13,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +15: [2023-05-13 01:00:13,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 6: [2023-05-13 01:00:13,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +29: [2023-05-13 01:00:13,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:13,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +31: [2023-05-13 01:00:13,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +29: [2023-05-13 01:00:13,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +29: [2023-05-13 01:00:13,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +17: [2023-05-13 01:00:13,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:13,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +31: [2023-05-13 01:00:13,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +31: [2023-05-13 01:00:13,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +31: [2023-05-13 01:00:13,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +31: [2023-05-13 01:00:13,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +31: [2023-05-13 01:00:13,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +31: [2023-05-13 01:00:13,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +31: [2023-05-13 01:00:13,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +29: [2023-05-13 01:00:13,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:13,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +31: [2023-05-13 01:00:13,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +17: [2023-05-13 01:00:13,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +23: [2023-05-13 01:00:13,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +17: [2023-05-13 01:00:13,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:13,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +31: [2023-05-13 01:00:13,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +29: [2023-05-13 01:00:13,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:13,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +17: [2023-05-13 01:00:13,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:13,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +23: [2023-05-13 01:00:13,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +23: [2023-05-13 01:00:13,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +23: [2023-05-13 01:00:13,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +23: [2023-05-13 01:00:13,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +12: [2023-05-13 01:00:13,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +23: [2023-05-13 01:00:13,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:13,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +22: [2023-05-13 01:00:13,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +22: [2023-05-13 01:00:13,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +22: [2023-05-13 01:00:13,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +22: [2023-05-13 01:00:13,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +12: [2023-05-13 01:00:13,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +23: [2023-05-13 01:00:13,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +19: [2023-05-13 01:00:13,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +19: [2023-05-13 01:00:13,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +19: [2023-05-13 01:00:13,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +23: [2023-05-13 01:00:13,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +19: [2023-05-13 01:00:13,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +23: [2023-05-13 01:00:13,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +19: [2023-05-13 01:00:13,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +19: [2023-05-13 01:00:13,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +19: [2023-05-13 01:00:13,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +19: [2023-05-13 01:00:13,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +19: [2023-05-13 01:00:13,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +19: [2023-05-13 01:00:13,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +19: [2023-05-13 01:00:13,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +19: [2023-05-13 01:00:13,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +19: [2023-05-13 01:00:13,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +12: [2023-05-13 01:00:13,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +12: [2023-05-13 01:00:13,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:13,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 4: [2023-05-13 01:00:13,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 4: [2023-05-13 01:00:13,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +13: [2023-05-13 01:00:13,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +13: [2023-05-13 01:00:13,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +23: [2023-05-13 01:00:13,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +13: [2023-05-13 01:00:13,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +13: [2023-05-13 01:00:13,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +13: [2023-05-13 01:00:13,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +13: [2023-05-13 01:00:13,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +13: [2023-05-13 01:00:13,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +13: [2023-05-13 01:00:13,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +13: [2023-05-13 01:00:13,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +13: [2023-05-13 01:00:13,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +13: [2023-05-13 01:00:13,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +31: [2023-05-13 01:00:13,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +31: [2023-05-13 01:00:13,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +13: [2023-05-13 01:00:13,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +22: [2023-05-13 01:00:13,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +13: [2023-05-13 01:00:13,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +13: [2023-05-13 01:00:13,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +31: [2023-05-13 01:00:13,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +31: [2023-05-13 01:00:13,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +13: [2023-05-13 01:00:13,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +13: [2023-05-13 01:00:13,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +22: [2023-05-13 01:00:13,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +12: [2023-05-13 01:00:13,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +22: [2023-05-13 01:00:13,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +31: [2023-05-13 01:00:13,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +31: [2023-05-13 01:00:13,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +31: [2023-05-13 01:00:13,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +31: [2023-05-13 01:00:13,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +22: [2023-05-13 01:00:13,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:13,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:13,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +12: [2023-05-13 01:00:13,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +12: [2023-05-13 01:00:13,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:13,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +16: [2023-05-13 01:00:13,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +16: [2023-05-13 01:00:13,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +16: [2023-05-13 01:00:13,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +16: [2023-05-13 01:00:13,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +16: [2023-05-13 01:00:13,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +16: [2023-05-13 01:00:13,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +16: [2023-05-13 01:00:13,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +16: [2023-05-13 01:00:13,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +16: [2023-05-13 01:00:13,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +16: [2023-05-13 01:00:13,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +31: [2023-05-13 01:00:13,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +18: [2023-05-13 01:00:13,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +18: [2023-05-13 01:00:13,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +16: [2023-05-13 01:00:13,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +12: [2023-05-13 01:00:13,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +18: [2023-05-13 01:00:13,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +18: [2023-05-13 01:00:13,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +22: [2023-05-13 01:00:13,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:13,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +18: [2023-05-13 01:00:13,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +18: [2023-05-13 01:00:13,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +18: [2023-05-13 01:00:13,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +18: [2023-05-13 01:00:13,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +18: [2023-05-13 01:00:13,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +18: [2023-05-13 01:00:13,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +16: [2023-05-13 01:00:13,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +16: [2023-05-13 01:00:13,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +16: [2023-05-13 01:00:13,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +16: [2023-05-13 01:00:13,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +16: [2023-05-13 01:00:13,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +18: [2023-05-13 01:00:13,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +18: [2023-05-13 01:00:13,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +18: [2023-05-13 01:00:13,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +10: [2023-05-13 01:00:13,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +10: [2023-05-13 01:00:13,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +10: [2023-05-13 01:00:13,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +10: [2023-05-13 01:00:13,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +10: [2023-05-13 01:00:13,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +10: [2023-05-13 01:00:13,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +10: [2023-05-13 01:00:13,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +31: [2023-05-13 01:00:13,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +18: [2023-05-13 01:00:13,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +31: [2023-05-13 01:00:13,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +18: [2023-05-13 01:00:13,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +18: [2023-05-13 01:00:13,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +22: [2023-05-13 01:00:13,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +10: [2023-05-13 01:00:13,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +12: [2023-05-13 01:00:13,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +10: [2023-05-13 01:00:13,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +22: [2023-05-13 01:00:13,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:13,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:13,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:13,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +12: [2023-05-13 01:00:13,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +31: [2023-05-13 01:00:13,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +12: [2023-05-13 01:00:13,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +12: [2023-05-13 01:00:13,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +19: [2023-05-13 01:00:13,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +19: [2023-05-13 01:00:13,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +19: [2023-05-13 01:00:13,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +19: [2023-05-13 01:00:13,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +19: [2023-05-13 01:00:13,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +19: [2023-05-13 01:00:13,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +19: [2023-05-13 01:00:13,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +19: [2023-05-13 01:00:13,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +19: [2023-05-13 01:00:13,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +19: [2023-05-13 01:00:13,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +12: [2023-05-13 01:00:13,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +13: [2023-05-13 01:00:13,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +13: [2023-05-13 01:00:13,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +13: [2023-05-13 01:00:13,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +19: [2023-05-13 01:00:13,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +13: [2023-05-13 01:00:13,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +13: [2023-05-13 01:00:13,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +16: [2023-05-13 01:00:13,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +12: [2023-05-13 01:00:13,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +12: [2023-05-13 01:00:13,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +12: [2023-05-13 01:00:13,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +13: [2023-05-13 01:00:13,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +13: [2023-05-13 01:00:13,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +13: [2023-05-13 01:00:13,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +13: [2023-05-13 01:00:13,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +13: [2023-05-13 01:00:13,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +13: [2023-05-13 01:00:13,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +18: [2023-05-13 01:00:13,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +18: [2023-05-13 01:00:13,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +19: [2023-05-13 01:00:13,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +19: [2023-05-13 01:00:13,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +19: [2023-05-13 01:00:13,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +13: [2023-05-13 01:00:13,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +18: [2023-05-13 01:00:13,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +18: [2023-05-13 01:00:13,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +13: [2023-05-13 01:00:13,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +19: [2023-05-13 01:00:13,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +16: [2023-05-13 01:00:13,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +20: [2023-05-13 01:00:13,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +20: [2023-05-13 01:00:13,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +20: [2023-05-13 01:00:13,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +20: [2023-05-13 01:00:13,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +20: [2023-05-13 01:00:13,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +20: [2023-05-13 01:00:13,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +20: [2023-05-13 01:00:13,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +20: [2023-05-13 01:00:13,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +10: [2023-05-13 01:00:13,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +10: [2023-05-13 01:00:13,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +10: [2023-05-13 01:00:13,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +18: [2023-05-13 01:00:13,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 3: [2023-05-13 01:00:13,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:13,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +10: [2023-05-13 01:00:13,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +20: [2023-05-13 01:00:13,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +30: [2023-05-13 01:00:13,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +16: [2023-05-13 01:00:13,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +13: [2023-05-13 01:00:13,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +30: [2023-05-13 01:00:13,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +20: [2023-05-13 01:00:13,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +13: [2023-05-13 01:00:13,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +20: [2023-05-13 01:00:13,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +13: [2023-05-13 01:00:13,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 3: [2023-05-13 01:00:13,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:13,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +28: [2023-05-13 01:00:13,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +28: [2023-05-13 01:00:13,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +28: [2023-05-13 01:00:13,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +28: [2023-05-13 01:00:13,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +28: [2023-05-13 01:00:13,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +18: [2023-05-13 01:00:13,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +18: [2023-05-13 01:00:13,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +18: [2023-05-13 01:00:13,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:13,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:13,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +26: [2023-05-13 01:00:13,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +26: [2023-05-13 01:00:13,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +26: [2023-05-13 01:00:13,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +20: [2023-05-13 01:00:13,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +26: [2023-05-13 01:00:13,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +26: [2023-05-13 01:00:13,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +26: [2023-05-13 01:00:13,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +26: [2023-05-13 01:00:13,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +16: [2023-05-13 01:00:13,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +16: [2023-05-13 01:00:13,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +16: [2023-05-13 01:00:13,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +26: [2023-05-13 01:00:13,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +16: [2023-05-13 01:00:13,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +16: [2023-05-13 01:00:13,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +16: [2023-05-13 01:00:13,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +26: [2023-05-13 01:00:13,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +30: [2023-05-13 01:00:13,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +18: [2023-05-13 01:00:13,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:13,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +26: [2023-05-13 01:00:13,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +26: [2023-05-13 01:00:13,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +18: [2023-05-13 01:00:13,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +26: [2023-05-13 01:00:13,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +26: [2023-05-13 01:00:13,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +10: [2023-05-13 01:00:13,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:13,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +18: [2023-05-13 01:00:13,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:13,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 5: [2023-05-13 01:00:13,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +10: [2023-05-13 01:00:13,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +10: [2023-05-13 01:00:13,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +10: [2023-05-13 01:00:13,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +10: [2023-05-13 01:00:13,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +10: [2023-05-13 01:00:13,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +18: [2023-05-13 01:00:13,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +16: [2023-05-13 01:00:13,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +10: [2023-05-13 01:00:13,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +18: [2023-05-13 01:00:13,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +24: [2023-05-13 01:00:13,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +24: [2023-05-13 01:00:13,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +18: [2023-05-13 01:00:13,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +24: [2023-05-13 01:00:13,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +10: [2023-05-13 01:00:13,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 5: [2023-05-13 01:00:13,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:13,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +24: [2023-05-13 01:00:13,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +24: [2023-05-13 01:00:13,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +24: [2023-05-13 01:00:13,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +24: [2023-05-13 01:00:13,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +24: [2023-05-13 01:00:13,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +16: [2023-05-13 01:00:13,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +16: [2023-05-13 01:00:13,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:13,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +24: [2023-05-13 01:00:13,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +18: [2023-05-13 01:00:13,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +16: [2023-05-13 01:00:13,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +16: [2023-05-13 01:00:13,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:13,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +24: [2023-05-13 01:00:13,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +24: [2023-05-13 01:00:13,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +24: [2023-05-13 01:00:13,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +30: [2023-05-13 01:00:13,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +24: [2023-05-13 01:00:13,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +16: [2023-05-13 01:00:13,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +16: [2023-05-13 01:00:13,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:13,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +30: [2023-05-13 01:00:13,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +26: [2023-05-13 01:00:13,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +18: [2023-05-13 01:00:13,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:13,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +28: [2023-05-13 01:00:13,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +28: [2023-05-13 01:00:13,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +28: [2023-05-13 01:00:13,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +28: [2023-05-13 01:00:13,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +28: [2023-05-13 01:00:13,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +28: [2023-05-13 01:00:13,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +28: [2023-05-13 01:00:13,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +28: [2023-05-13 01:00:13,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +28: [2023-05-13 01:00:13,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +28: [2023-05-13 01:00:13,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... +28: [2023-05-13 01:00:13,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +30: [2023-05-13 01:00:13,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +26: [2023-05-13 01:00:13,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:13,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +20: [2023-05-13 01:00:13,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +30: [2023-05-13 01:00:13,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:13,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:13,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +20: [2023-05-13 01:00:13,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 1: [2023-05-13 01:00:13,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 1: [2023-05-13 01:00:13,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:13,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:13,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +30: [2023-05-13 01:00:13,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 0: [2023-05-13 01:00:13,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +26: [2023-05-13 01:00:13,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +26: [2023-05-13 01:00:13,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +26: [2023-05-13 01:00:13,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +26: [2023-05-13 01:00:13,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +26: [2023-05-13 01:00:13,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +24: [2023-05-13 01:00:13,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +26: [2023-05-13 01:00:13,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:13,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:13,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +20: [2023-05-13 01:00:13,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. + 8: [2023-05-13 01:00:13,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:13,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:13,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:13,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +30: [2023-05-13 01:00:13,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:13,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +20: [2023-05-13 01:00:13,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +28: [2023-05-13 01:00:13,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +28: [2023-05-13 01:00:13,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +28: [2023-05-13 01:00:13,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +28: [2023-05-13 01:00:13,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +28: [2023-05-13 01:00:13,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +28: [2023-05-13 01:00:13,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +28: [2023-05-13 01:00:13,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +28: [2023-05-13 01:00:13,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +28: [2023-05-13 01:00:13,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +28: [2023-05-13 01:00:13,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +28: [2023-05-13 01:00:13,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +28: [2023-05-13 01:00:13,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +28: [2023-05-13 01:00:13,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +28: [2023-05-13 01:00:13,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +28: [2023-05-13 01:00:13,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +28: [2023-05-13 01:00:13,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:13,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 8: [2023-05-13 01:00:13,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:13,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +30: [2023-05-13 01:00:13,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +30: [2023-05-13 01:00:13,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 0: [2023-05-13 01:00:13,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:13,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:14,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:14,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:14,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +26: [2023-05-13 01:00:14,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:14,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:14,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:14,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:14,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +24: [2023-05-13 01:00:14,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +24: [2023-05-13 01:00:14,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_26-model_00-model_states.pt. +24: [2023-05-13 01:00:14,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:14,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:14,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:14,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:14,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:14,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:14,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:14,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:14,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +14: [2023-05-13 01:00:14,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +14: [2023-05-13 01:00:14,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +14: [2023-05-13 01:00:14,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +14: [2023-05-13 01:00:14,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +14: [2023-05-13 01:00:14,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +14: [2023-05-13 01:00:14,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +14: [2023-05-13 01:00:14,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +14: [2023-05-13 01:00:14,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +14: [2023-05-13 01:00:14,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +14: [2023-05-13 01:00:14,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +14: [2023-05-13 01:00:14,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +14: [2023-05-13 01:00:14,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +14: [2023-05-13 01:00:14,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +14: [2023-05-13 01:00:14,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +14: [2023-05-13 01:00:14,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +14: [2023-05-13 01:00:14,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +14: [2023-05-13 01:00:14,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +14: [2023-05-13 01:00:14,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +14: [2023-05-13 01:00:14,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +14: [2023-05-13 01:00:14,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +14: [2023-05-13 01:00:14,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +14: [2023-05-13 01:00:14,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +14: [2023-05-13 01:00:14,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +14: [2023-05-13 01:00:14,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +27: [2023-05-13 01:00:14,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +27: [2023-05-13 01:00:14,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +27: [2023-05-13 01:00:14,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +27: [2023-05-13 01:00:14,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +27: [2023-05-13 01:00:14,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +27: [2023-05-13 01:00:14,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +27: [2023-05-13 01:00:14,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +27: [2023-05-13 01:00:14,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +27: [2023-05-13 01:00:14,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +11: [2023-05-13 01:00:14,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +11: [2023-05-13 01:00:14,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +27: [2023-05-13 01:00:14,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +27: [2023-05-13 01:00:14,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +27: [2023-05-13 01:00:14,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +11: [2023-05-13 01:00:14,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +11: [2023-05-13 01:00:14,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +11: [2023-05-13 01:00:14,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +11: [2023-05-13 01:00:14,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +11: [2023-05-13 01:00:14,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +27: [2023-05-13 01:00:14,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +11: [2023-05-13 01:00:14,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +27: [2023-05-13 01:00:14,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +27: [2023-05-13 01:00:14,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +11: [2023-05-13 01:00:14,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +27: [2023-05-13 01:00:14,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +11: [2023-05-13 01:00:14,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +11: [2023-05-13 01:00:14,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +14: [2023-05-13 01:00:14,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +11: [2023-05-13 01:00:14,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +14: [2023-05-13 01:00:14,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +14: [2023-05-13 01:00:14,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +11: [2023-05-13 01:00:14,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +14: [2023-05-13 01:00:14,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +14: [2023-05-13 01:00:14,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +14: [2023-05-13 01:00:14,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +14: [2023-05-13 01:00:14,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +14: [2023-05-13 01:00:14,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +21: [2023-05-13 01:00:14,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +21: [2023-05-13 01:00:14,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +29: [2023-05-13 01:00:14,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +11: [2023-05-13 01:00:14,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +21: [2023-05-13 01:00:14,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +21: [2023-05-13 01:00:14,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +21: [2023-05-13 01:00:14,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +21: [2023-05-13 01:00:14,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +21: [2023-05-13 01:00:14,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +21: [2023-05-13 01:00:14,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:14,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +22: [2023-05-13 01:00:14,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +22: [2023-05-13 01:00:14,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +22: [2023-05-13 01:00:14,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +22: [2023-05-13 01:00:14,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:14,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +22: [2023-05-13 01:00:14,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +21: [2023-05-13 01:00:14,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +21: [2023-05-13 01:00:14,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +27: [2023-05-13 01:00:14,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +29: [2023-05-13 01:00:14,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:14,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +29: [2023-05-13 01:00:14,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +21: [2023-05-13 01:00:14,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +21: [2023-05-13 01:00:14,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +21: [2023-05-13 01:00:14,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +22: [2023-05-13 01:00:14,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +21: [2023-05-13 01:00:14,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:14,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:14,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:14,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:14,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:14,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:14,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:14,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +21: [2023-05-13 01:00:14,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +27: [2023-05-13 01:00:14,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +21: [2023-05-13 01:00:14,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +27: [2023-05-13 01:00:14,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +27: [2023-05-13 01:00:14,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +27: [2023-05-13 01:00:14,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +27: [2023-05-13 01:00:14,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +27: [2023-05-13 01:00:14,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +27: [2023-05-13 01:00:14,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +11: [2023-05-13 01:00:14,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +11: [2023-05-13 01:00:14,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +11: [2023-05-13 01:00:14,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +27: [2023-05-13 01:00:14,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +11: [2023-05-13 01:00:14,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +11: [2023-05-13 01:00:14,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +11: [2023-05-13 01:00:14,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +15: [2023-05-13 01:00:14,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +15: [2023-05-13 01:00:14,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +15: [2023-05-13 01:00:14,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +15: [2023-05-13 01:00:14,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +15: [2023-05-13 01:00:14,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +15: [2023-05-13 01:00:14,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +15: [2023-05-13 01:00:14,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +15: [2023-05-13 01:00:14,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +27: [2023-05-13 01:00:14,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +27: [2023-05-13 01:00:14,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +27: [2023-05-13 01:00:14,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +15: [2023-05-13 01:00:14,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +27: [2023-05-13 01:00:14,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +15: [2023-05-13 01:00:14,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +15: [2023-05-13 01:00:14,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +27: [2023-05-13 01:00:14,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +27: [2023-05-13 01:00:14,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +27: [2023-05-13 01:00:14,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +11: [2023-05-13 01:00:14,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +22: [2023-05-13 01:00:14,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +22: [2023-05-13 01:00:14,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +21: [2023-05-13 01:00:14,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +22: [2023-05-13 01:00:14,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +21: [2023-05-13 01:00:14,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +21: [2023-05-13 01:00:14,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +21: [2023-05-13 01:00:14,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +11: [2023-05-13 01:00:14,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +29: [2023-05-13 01:00:14,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +11: [2023-05-13 01:00:14,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +22: [2023-05-13 01:00:14,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +21: [2023-05-13 01:00:14,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +21: [2023-05-13 01:00:14,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +21: [2023-05-13 01:00:14,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +22: [2023-05-13 01:00:14,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +22: [2023-05-13 01:00:14,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +19: [2023-05-13 01:00:14,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +19: [2023-05-13 01:00:14,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +19: [2023-05-13 01:00:14,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +19: [2023-05-13 01:00:14,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +17: [2023-05-13 01:00:14,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +17: [2023-05-13 01:00:14,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +17: [2023-05-13 01:00:14,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +19: [2023-05-13 01:00:14,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +19: [2023-05-13 01:00:14,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +19: [2023-05-13 01:00:14,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +17: [2023-05-13 01:00:14,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +17: [2023-05-13 01:00:14,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +19: [2023-05-13 01:00:14,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +17: [2023-05-13 01:00:14,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +19: [2023-05-13 01:00:14,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +17: [2023-05-13 01:00:14,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +22: [2023-05-13 01:00:14,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +17: [2023-05-13 01:00:14,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +17: [2023-05-13 01:00:14,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +17: [2023-05-13 01:00:14,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:14,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +19: [2023-05-13 01:00:14,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +17: [2023-05-13 01:00:14,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +21: [2023-05-13 01:00:14,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +19: [2023-05-13 01:00:14,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:14,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +17: [2023-05-13 01:00:14,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +19: [2023-05-13 01:00:14,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +21: [2023-05-13 01:00:14,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +22: [2023-05-13 01:00:14,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +21: [2023-05-13 01:00:14,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +21: [2023-05-13 01:00:14,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +29: [2023-05-13 01:00:14,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +29: [2023-05-13 01:00:14,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +22: [2023-05-13 01:00:14,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:14,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +21: [2023-05-13 01:00:14,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +22: [2023-05-13 01:00:14,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +29: [2023-05-13 01:00:14,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +21: [2023-05-13 01:00:14,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +15: [2023-05-13 01:00:14,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +15: [2023-05-13 01:00:14,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +15: [2023-05-13 01:00:14,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +12: [2023-05-13 01:00:14,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +22: [2023-05-13 01:00:14,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +12: [2023-05-13 01:00:14,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +21: [2023-05-13 01:00:14,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +12: [2023-05-13 01:00:14,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +12: [2023-05-13 01:00:14,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +12: [2023-05-13 01:00:14,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +12: [2023-05-13 01:00:14,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +12: [2023-05-13 01:00:14,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +12: [2023-05-13 01:00:14,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +21: [2023-05-13 01:00:14,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +12: [2023-05-13 01:00:14,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +29: [2023-05-13 01:00:14,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +12: [2023-05-13 01:00:14,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +12: [2023-05-13 01:00:14,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +12: [2023-05-13 01:00:14,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +12: [2023-05-13 01:00:14,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +12: [2023-05-13 01:00:14,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +12: [2023-05-13 01:00:14,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +12: [2023-05-13 01:00:14,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +15: [2023-05-13 01:00:14,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +22: [2023-05-13 01:00:14,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +22: [2023-05-13 01:00:14,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +21: [2023-05-13 01:00:14,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +15: [2023-05-13 01:00:14,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +15: [2023-05-13 01:00:14,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +23: [2023-05-13 01:00:14,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +23: [2023-05-13 01:00:14,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +23: [2023-05-13 01:00:14,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +23: [2023-05-13 01:00:14,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +23: [2023-05-13 01:00:14,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +23: [2023-05-13 01:00:14,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +23: [2023-05-13 01:00:14,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +23: [2023-05-13 01:00:14,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +23: [2023-05-13 01:00:14,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +23: [2023-05-13 01:00:14,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +23: [2023-05-13 01:00:14,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +23: [2023-05-13 01:00:14,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +15: [2023-05-13 01:00:14,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +23: [2023-05-13 01:00:14,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +15: [2023-05-13 01:00:14,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +23: [2023-05-13 01:00:14,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +23: [2023-05-13 01:00:14,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +15: [2023-05-13 01:00:14,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +23: [2023-05-13 01:00:14,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +17: [2023-05-13 01:00:14,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +17: [2023-05-13 01:00:14,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +17: [2023-05-13 01:00:14,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +15: [2023-05-13 01:00:14,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +12: [2023-05-13 01:00:14,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +19: [2023-05-13 01:00:14,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +19: [2023-05-13 01:00:14,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +10: [2023-05-13 01:00:14,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +10: [2023-05-13 01:00:14,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +10: [2023-05-13 01:00:14,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +10: [2023-05-13 01:00:14,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +10: [2023-05-13 01:00:14,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +10: [2023-05-13 01:00:14,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +10: [2023-05-13 01:00:14,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +10: [2023-05-13 01:00:14,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +10: [2023-05-13 01:00:14,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +10: [2023-05-13 01:00:14,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +10: [2023-05-13 01:00:14,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +10: [2023-05-13 01:00:14,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +10: [2023-05-13 01:00:14,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +10: [2023-05-13 01:00:14,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +10: [2023-05-13 01:00:14,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +10: [2023-05-13 01:00:14,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +12: [2023-05-13 01:00:14,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +17: [2023-05-13 01:00:14,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +17: [2023-05-13 01:00:14,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +19: [2023-05-13 01:00:14,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +19: [2023-05-13 01:00:14,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +23: [2023-05-13 01:00:14,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +23: [2023-05-13 01:00:14,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +23: [2023-05-13 01:00:14,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +12: [2023-05-13 01:00:14,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +12: [2023-05-13 01:00:14,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +19: [2023-05-13 01:00:14,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +19: [2023-05-13 01:00:14,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +19: [2023-05-13 01:00:14,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +12: [2023-05-13 01:00:14,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +12: [2023-05-13 01:00:14,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +17: [2023-05-13 01:00:14,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +17: [2023-05-13 01:00:14,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +23: [2023-05-13 01:00:14,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +23: [2023-05-13 01:00:14,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +12: [2023-05-13 01:00:14,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +23: [2023-05-13 01:00:14,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +23: [2023-05-13 01:00:14,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +19: [2023-05-13 01:00:14,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +23: [2023-05-13 01:00:14,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +19: [2023-05-13 01:00:14,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +12: [2023-05-13 01:00:14,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +10: [2023-05-13 01:00:14,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +12: [2023-05-13 01:00:14,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +12: [2023-05-13 01:00:14,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +12: [2023-05-13 01:00:14,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +12: [2023-05-13 01:00:14,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +25: [2023-05-13 01:00:14,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +25: [2023-05-13 01:00:14,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +25: [2023-05-13 01:00:14,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +12: [2023-05-13 01:00:14,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +10: [2023-05-13 01:00:14,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +25: [2023-05-13 01:00:14,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +25: [2023-05-13 01:00:14,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +25: [2023-05-13 01:00:14,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +25: [2023-05-13 01:00:14,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +10: [2023-05-13 01:00:14,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +10: [2023-05-13 01:00:14,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +25: [2023-05-13 01:00:14,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +25: [2023-05-13 01:00:14,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +25: [2023-05-13 01:00:14,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +25: [2023-05-13 01:00:14,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +25: [2023-05-13 01:00:14,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +25: [2023-05-13 01:00:14,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +25: [2023-05-13 01:00:14,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +25: [2023-05-13 01:00:14,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +23: [2023-05-13 01:00:14,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +25: [2023-05-13 01:00:14,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +23: [2023-05-13 01:00:14,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +23: [2023-05-13 01:00:14,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +10: [2023-05-13 01:00:14,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +10: [2023-05-13 01:00:14,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +10: [2023-05-13 01:00:14,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +23: [2023-05-13 01:00:14,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +10: [2023-05-13 01:00:14,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +10: [2023-05-13 01:00:14,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +23: [2023-05-13 01:00:14,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +12: [2023-05-13 01:00:14,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +12: [2023-05-13 01:00:14,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +12: [2023-05-13 01:00:14,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +10: [2023-05-13 01:00:14,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +10: [2023-05-13 01:00:14,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +10: [2023-05-13 01:00:14,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +23: [2023-05-13 01:00:14,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +13: [2023-05-13 01:00:14,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +13: [2023-05-13 01:00:14,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +10: [2023-05-13 01:00:14,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +23: [2023-05-13 01:00:14,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +13: [2023-05-13 01:00:14,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:14,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +26: [2023-05-13 01:00:14,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +13: [2023-05-13 01:00:14,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +31: [2023-05-13 01:00:14,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +31: [2023-05-13 01:00:14,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +23: [2023-05-13 01:00:14,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +13: [2023-05-13 01:00:14,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +13: [2023-05-13 01:00:14,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +13: [2023-05-13 01:00:14,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +13: [2023-05-13 01:00:14,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +13: [2023-05-13 01:00:14,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +26: [2023-05-13 01:00:14,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +31: [2023-05-13 01:00:14,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +31: [2023-05-13 01:00:14,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +13: [2023-05-13 01:00:14,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:14,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +31: [2023-05-13 01:00:14,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +31: [2023-05-13 01:00:14,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +31: [2023-05-13 01:00:14,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +10: [2023-05-13 01:00:14,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +10: [2023-05-13 01:00:14,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +31: [2023-05-13 01:00:14,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +13: [2023-05-13 01:00:14,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:14,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +10: [2023-05-13 01:00:14,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +25: [2023-05-13 01:00:14,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +25: [2023-05-13 01:00:14,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +26: [2023-05-13 01:00:14,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +26: [2023-05-13 01:00:14,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +26: [2023-05-13 01:00:14,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +26: [2023-05-13 01:00:14,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +26: [2023-05-13 01:00:14,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +26: [2023-05-13 01:00:14,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +31: [2023-05-13 01:00:14,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:14,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:14,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +13: [2023-05-13 01:00:14,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:14,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:14,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +13: [2023-05-13 01:00:14,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +13: [2023-05-13 01:00:14,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:14,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +13: [2023-05-13 01:00:14,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +13: [2023-05-13 01:00:14,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:14,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:14,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:14,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:14,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:14,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:14,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:14,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +25: [2023-05-13 01:00:14,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +25: [2023-05-13 01:00:14,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +25: [2023-05-13 01:00:14,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +25: [2023-05-13 01:00:14,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +25: [2023-05-13 01:00:14,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +25: [2023-05-13 01:00:14,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +25: [2023-05-13 01:00:14,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +28: [2023-05-13 01:00:14,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +28: [2023-05-13 01:00:14,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +28: [2023-05-13 01:00:14,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +28: [2023-05-13 01:00:14,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +28: [2023-05-13 01:00:14,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +28: [2023-05-13 01:00:14,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +28: [2023-05-13 01:00:14,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +26: [2023-05-13 01:00:14,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +28: [2023-05-13 01:00:14,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +28: [2023-05-13 01:00:14,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +13: [2023-05-13 01:00:14,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +13: [2023-05-13 01:00:14,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +13: [2023-05-13 01:00:14,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +28: [2023-05-13 01:00:14,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +28: [2023-05-13 01:00:14,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +28: [2023-05-13 01:00:14,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +28: [2023-05-13 01:00:14,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +28: [2023-05-13 01:00:14,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +28: [2023-05-13 01:00:14,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +28: [2023-05-13 01:00:14,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +31: [2023-05-13 01:00:14,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +31: [2023-05-13 01:00:14,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +25: [2023-05-13 01:00:14,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +25: [2023-05-13 01:00:14,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +26: [2023-05-13 01:00:14,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +31: [2023-05-13 01:00:14,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +31: [2023-05-13 01:00:14,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +31: [2023-05-13 01:00:14,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +31: [2023-05-13 01:00:14,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +25: [2023-05-13 01:00:14,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +16: [2023-05-13 01:00:14,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:14,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:14,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +25: [2023-05-13 01:00:14,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +13: [2023-05-13 01:00:14,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +13: [2023-05-13 01:00:14,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +16: [2023-05-13 01:00:14,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:14,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +13: [2023-05-13 01:00:14,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +13: [2023-05-13 01:00:14,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +16: [2023-05-13 01:00:14,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:14,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +25: [2023-05-13 01:00:14,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +13: [2023-05-13 01:00:14,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +26: [2023-05-13 01:00:14,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +26: [2023-05-13 01:00:14,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +13: [2023-05-13 01:00:14,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +13: [2023-05-13 01:00:14,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +26: [2023-05-13 01:00:14,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +30: [2023-05-13 01:00:14,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +30: [2023-05-13 01:00:14,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +30: [2023-05-13 01:00:14,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +30: [2023-05-13 01:00:14,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +30: [2023-05-13 01:00:14,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +30: [2023-05-13 01:00:14,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +30: [2023-05-13 01:00:14,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +30: [2023-05-13 01:00:14,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +30: [2023-05-13 01:00:14,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +31: [2023-05-13 01:00:14,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +30: [2023-05-13 01:00:14,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +30: [2023-05-13 01:00:14,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +30: [2023-05-13 01:00:14,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +25: [2023-05-13 01:00:14,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +30: [2023-05-13 01:00:14,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +25: [2023-05-13 01:00:14,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:14,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +30: [2023-05-13 01:00:14,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:14,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:14,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +30: [2023-05-13 01:00:14,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +30: [2023-05-13 01:00:14,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +13: [2023-05-13 01:00:14,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +31: [2023-05-13 01:00:14,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +31: [2023-05-13 01:00:14,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +31: [2023-05-13 01:00:14,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +13: [2023-05-13 01:00:14,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +13: [2023-05-13 01:00:14,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +13: [2023-05-13 01:00:14,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +26: [2023-05-13 01:00:14,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +31: [2023-05-13 01:00:14,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +31: [2023-05-13 01:00:14,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +26: [2023-05-13 01:00:14,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +13: [2023-05-13 01:00:14,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +16: [2023-05-13 01:00:14,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +26: [2023-05-13 01:00:14,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +28: [2023-05-13 01:00:14,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +28: [2023-05-13 01:00:14,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +28: [2023-05-13 01:00:14,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +28: [2023-05-13 01:00:14,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +28: [2023-05-13 01:00:14,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +28: [2023-05-13 01:00:14,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +28: [2023-05-13 01:00:14,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +28: [2023-05-13 01:00:14,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +26: [2023-05-13 01:00:14,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +26: [2023-05-13 01:00:14,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +26: [2023-05-13 01:00:14,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +13: [2023-05-13 01:00:14,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +20: [2023-05-13 01:00:14,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +20: [2023-05-13 01:00:14,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +20: [2023-05-13 01:00:14,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +20: [2023-05-13 01:00:14,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +20: [2023-05-13 01:00:14,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +20: [2023-05-13 01:00:14,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +20: [2023-05-13 01:00:14,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +20: [2023-05-13 01:00:14,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +20: [2023-05-13 01:00:14,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +18: [2023-05-13 01:00:14,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +18: [2023-05-13 01:00:14,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +18: [2023-05-13 01:00:14,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +20: [2023-05-13 01:00:14,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +18: [2023-05-13 01:00:14,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +18: [2023-05-13 01:00:14,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +18: [2023-05-13 01:00:14,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +18: [2023-05-13 01:00:14,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +20: [2023-05-13 01:00:14,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +18: [2023-05-13 01:00:14,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +18: [2023-05-13 01:00:14,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +18: [2023-05-13 01:00:14,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +18: [2023-05-13 01:00:14,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +16: [2023-05-13 01:00:14,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +18: [2023-05-13 01:00:14,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +26: [2023-05-13 01:00:14,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +20: [2023-05-13 01:00:14,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +16: [2023-05-13 01:00:14,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +18: [2023-05-13 01:00:14,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:14,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:14,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +24: [2023-05-13 01:00:14,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:14,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +18: [2023-05-13 01:00:14,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +18: [2023-05-13 01:00:14,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +20: [2023-05-13 01:00:14,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +18: [2023-05-13 01:00:14,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:14,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +24: [2023-05-13 01:00:14,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +24: [2023-05-13 01:00:14,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +24: [2023-05-13 01:00:14,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +24: [2023-05-13 01:00:14,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +24: [2023-05-13 01:00:14,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +24: [2023-05-13 01:00:14,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +20: [2023-05-13 01:00:14,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:14,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +30: [2023-05-13 01:00:14,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +24: [2023-05-13 01:00:14,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:14,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:14,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +28: [2023-05-13 01:00:14,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +26: [2023-05-13 01:00:14,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +30: [2023-05-13 01:00:14,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +28: [2023-05-13 01:00:14,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +28: [2023-05-13 01:00:14,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +30: [2023-05-13 01:00:14,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +24: [2023-05-13 01:00:14,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +28: [2023-05-13 01:00:14,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +24: [2023-05-13 01:00:14,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... +24: [2023-05-13 01:00:14,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +28: [2023-05-13 01:00:14,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +28: [2023-05-13 01:00:14,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +28: [2023-05-13 01:00:14,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +28: [2023-05-13 01:00:14,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +30: [2023-05-13 01:00:14,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +30: [2023-05-13 01:00:14,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +30: [2023-05-13 01:00:14,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +30: [2023-05-13 01:00:14,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +30: [2023-05-13 01:00:14,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +18: [2023-05-13 01:00:14,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +20: [2023-05-13 01:00:14,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +30: [2023-05-13 01:00:14,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +30: [2023-05-13 01:00:14,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +16: [2023-05-13 01:00:14,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +14: [2023-05-13 01:00:14,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +14: [2023-05-13 01:00:14,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +14: [2023-05-13 01:00:14,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +14: [2023-05-13 01:00:14,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +14: [2023-05-13 01:00:14,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +14: [2023-05-13 01:00:14,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +14: [2023-05-13 01:00:14,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +30: [2023-05-13 01:00:14,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +14: [2023-05-13 01:00:14,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +14: [2023-05-13 01:00:14,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +14: [2023-05-13 01:00:14,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +14: [2023-05-13 01:00:14,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +30: [2023-05-13 01:00:14,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +14: [2023-05-13 01:00:14,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +18: [2023-05-13 01:00:14,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +18: [2023-05-13 01:00:14,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +24: [2023-05-13 01:00:14,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +24: [2023-05-13 01:00:14,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +16: [2023-05-13 01:00:14,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +14: [2023-05-13 01:00:14,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +14: [2023-05-13 01:00:14,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +14: [2023-05-13 01:00:14,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +16: [2023-05-13 01:00:14,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +24: [2023-05-13 01:00:14,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +18: [2023-05-13 01:00:14,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +14: [2023-05-13 01:00:14,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +30: [2023-05-13 01:00:14,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +20: [2023-05-13 01:00:14,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +20: [2023-05-13 01:00:14,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +20: [2023-05-13 01:00:14,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +27: [2023-05-13 01:00:14,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +27: [2023-05-13 01:00:14,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +27: [2023-05-13 01:00:14,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +27: [2023-05-13 01:00:14,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +27: [2023-05-13 01:00:14,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +27: [2023-05-13 01:00:14,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +27: [2023-05-13 01:00:14,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +27: [2023-05-13 01:00:14,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +18: [2023-05-13 01:00:14,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +27: [2023-05-13 01:00:14,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +27: [2023-05-13 01:00:14,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +11: [2023-05-13 01:00:14,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +27: [2023-05-13 01:00:14,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +27: [2023-05-13 01:00:14,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +27: [2023-05-13 01:00:14,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +29: [2023-05-13 01:00:14,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +29: [2023-05-13 01:00:14,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +30: [2023-05-13 01:00:14,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +27: [2023-05-13 01:00:14,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +27: [2023-05-13 01:00:14,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +27: [2023-05-13 01:00:14,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +30: [2023-05-13 01:00:14,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +11: [2023-05-13 01:00:14,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +11: [2023-05-13 01:00:14,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +11: [2023-05-13 01:00:14,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +11: [2023-05-13 01:00:14,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +20: [2023-05-13 01:00:14,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +29: [2023-05-13 01:00:14,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +24: [2023-05-13 01:00:14,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +24: [2023-05-13 01:00:14,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +22: [2023-05-13 01:00:14,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +22: [2023-05-13 01:00:14,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +29: [2023-05-13 01:00:14,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +29: [2023-05-13 01:00:14,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +29: [2023-05-13 01:00:14,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +24: [2023-05-13 01:00:14,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +29: [2023-05-13 01:00:14,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +29: [2023-05-13 01:00:14,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +29: [2023-05-13 01:00:14,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +29: [2023-05-13 01:00:14,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +30: [2023-05-13 01:00:14,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +22: [2023-05-13 01:00:14,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +11: [2023-05-13 01:00:14,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +29: [2023-05-13 01:00:14,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +22: [2023-05-13 01:00:14,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +22: [2023-05-13 01:00:14,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +22: [2023-05-13 01:00:14,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +22: [2023-05-13 01:00:14,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +22: [2023-05-13 01:00:14,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +22: [2023-05-13 01:00:14,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +22: [2023-05-13 01:00:14,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +29: [2023-05-13 01:00:14,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +29: [2023-05-13 01:00:14,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +24: [2023-05-13 01:00:14,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +29: [2023-05-13 01:00:14,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +29: [2023-05-13 01:00:14,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +18: [2023-05-13 01:00:14,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +21: [2023-05-13 01:00:14,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +21: [2023-05-13 01:00:14,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +21: [2023-05-13 01:00:14,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +21: [2023-05-13 01:00:14,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +21: [2023-05-13 01:00:14,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +21: [2023-05-13 01:00:14,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +21: [2023-05-13 01:00:14,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +21: [2023-05-13 01:00:14,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +29: [2023-05-13 01:00:14,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +22: [2023-05-13 01:00:14,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +22: [2023-05-13 01:00:14,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +22: [2023-05-13 01:00:14,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +22: [2023-05-13 01:00:14,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +18: [2023-05-13 01:00:14,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +22: [2023-05-13 01:00:14,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +24: [2023-05-13 01:00:14,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +21: [2023-05-13 01:00:14,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +22: [2023-05-13 01:00:14,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +15: [2023-05-13 01:00:14,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +15: [2023-05-13 01:00:14,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +24: [2023-05-13 01:00:14,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +24: [2023-05-13 01:00:14,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +15: [2023-05-13 01:00:14,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +15: [2023-05-13 01:00:14,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +15: [2023-05-13 01:00:14,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +21: [2023-05-13 01:00:14,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +24: [2023-05-13 01:00:14,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +21: [2023-05-13 01:00:14,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +21: [2023-05-13 01:00:14,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +21: [2023-05-13 01:00:14,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +21: [2023-05-13 01:00:14,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +18: [2023-05-13 01:00:14,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +21: [2023-05-13 01:00:14,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +21: [2023-05-13 01:00:14,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +20: [2023-05-13 01:00:14,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +20: [2023-05-13 01:00:14,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +18: [2023-05-13 01:00:14,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +20: [2023-05-13 01:00:14,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +20: [2023-05-13 01:00:14,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +20: [2023-05-13 01:00:14,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_27-model_00-model_states.pt. +15: [2023-05-13 01:00:14,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +20: [2023-05-13 01:00:14,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +19: [2023-05-13 01:00:14,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +19: [2023-05-13 01:00:14,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +15: [2023-05-13 01:00:14,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +19: [2023-05-13 01:00:14,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +19: [2023-05-13 01:00:14,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +15: [2023-05-13 01:00:14,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +19: [2023-05-13 01:00:14,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +18: [2023-05-13 01:00:14,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +24: [2023-05-13 01:00:14,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +20: [2023-05-13 01:00:14,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +14: [2023-05-13 01:00:14,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +14: [2023-05-13 01:00:14,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +19: [2023-05-13 01:00:14,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +24: [2023-05-13 01:00:14,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +18: [2023-05-13 01:00:14,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +29: [2023-05-13 01:00:14,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +19: [2023-05-13 01:00:14,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +10: [2023-05-13 01:00:14,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +10: [2023-05-13 01:00:14,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +10: [2023-05-13 01:00:14,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +10: [2023-05-13 01:00:14,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +10: [2023-05-13 01:00:14,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +14: [2023-05-13 01:00:14,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +14: [2023-05-13 01:00:14,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +14: [2023-05-13 01:00:14,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +24: [2023-05-13 01:00:14,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +24: [2023-05-13 01:00:14,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +22: [2023-05-13 01:00:14,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +24: [2023-05-13 01:00:14,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +14: [2023-05-13 01:00:14,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +20: [2023-05-13 01:00:14,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +20: [2023-05-13 01:00:14,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +27: [2023-05-13 01:00:14,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +20: [2023-05-13 01:00:14,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +20: [2023-05-13 01:00:14,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +27: [2023-05-13 01:00:14,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +27: [2023-05-13 01:00:14,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +27: [2023-05-13 01:00:14,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +14: [2023-05-13 01:00:14,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +27: [2023-05-13 01:00:14,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +27: [2023-05-13 01:00:14,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +27: [2023-05-13 01:00:14,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +14: [2023-05-13 01:00:14,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +14: [2023-05-13 01:00:14,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +11: [2023-05-13 01:00:14,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +11: [2023-05-13 01:00:14,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +29: [2023-05-13 01:00:14,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +21: [2023-05-13 01:00:14,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +14: [2023-05-13 01:00:14,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +29: [2023-05-13 01:00:14,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +11: [2023-05-13 01:00:14,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +29: [2023-05-13 01:00:14,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +22: [2023-05-13 01:00:14,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +22: [2023-05-13 01:00:14,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +14: [2023-05-13 01:00:14,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +14: [2023-05-13 01:00:14,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +22: [2023-05-13 01:00:14,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +27: [2023-05-13 01:00:14,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +29: [2023-05-13 01:00:14,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +29: [2023-05-13 01:00:14,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +22: [2023-05-13 01:00:14,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +11: [2023-05-13 01:00:14,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +21: [2023-05-13 01:00:14,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +21: [2023-05-13 01:00:14,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +11: [2023-05-13 01:00:14,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +21: [2023-05-13 01:00:14,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +21: [2023-05-13 01:00:14,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +19: [2023-05-13 01:00:14,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +15: [2023-05-13 01:00:14,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +15: [2023-05-13 01:00:14,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +14: [2023-05-13 01:00:14,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +14: [2023-05-13 01:00:14,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +22: [2023-05-13 01:00:14,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +27: [2023-05-13 01:00:14,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +13: [2023-05-13 01:00:14,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +13: [2023-05-13 01:00:14,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +29: [2023-05-13 01:00:14,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +29: [2023-05-13 01:00:14,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +13: [2023-05-13 01:00:14,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +13: [2023-05-13 01:00:14,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +13: [2023-05-13 01:00:14,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +13: [2023-05-13 01:00:14,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +13: [2023-05-13 01:00:14,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +13: [2023-05-13 01:00:14,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +13: [2023-05-13 01:00:14,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:14,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +27: [2023-05-13 01:00:14,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +14: [2023-05-13 01:00:14,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +27: [2023-05-13 01:00:14,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:14,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +21: [2023-05-13 01:00:14,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +11: [2023-05-13 01:00:14,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +11: [2023-05-13 01:00:14,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +11: [2023-05-13 01:00:14,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:14,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +15: [2023-05-13 01:00:14,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +27: [2023-05-13 01:00:14,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +11: [2023-05-13 01:00:14,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +27: [2023-05-13 01:00:14,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +21: [2023-05-13 01:00:14,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +21: [2023-05-13 01:00:14,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +27: [2023-05-13 01:00:14,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +21: [2023-05-13 01:00:14,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +27: [2023-05-13 01:00:14,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:14,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +13: [2023-05-13 01:00:14,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +13: [2023-05-13 01:00:14,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +22: [2023-05-13 01:00:14,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +13: [2023-05-13 01:00:14,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +29: [2023-05-13 01:00:14,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +14: [2023-05-13 01:00:14,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +15: [2023-05-13 01:00:14,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +15: [2023-05-13 01:00:14,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +29: [2023-05-13 01:00:14,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +10: [2023-05-13 01:00:14,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +10: [2023-05-13 01:00:14,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +10: [2023-05-13 01:00:14,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +10: [2023-05-13 01:00:14,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +10: [2023-05-13 01:00:14,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +10: [2023-05-13 01:00:14,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +10: [2023-05-13 01:00:14,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +10: [2023-05-13 01:00:14,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +10: [2023-05-13 01:00:14,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +10: [2023-05-13 01:00:14,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +10: [2023-05-13 01:00:14,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +22: [2023-05-13 01:00:14,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +22: [2023-05-13 01:00:14,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:14,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +12: [2023-05-13 01:00:14,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +12: [2023-05-13 01:00:14,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +22: [2023-05-13 01:00:14,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:14,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +12: [2023-05-13 01:00:14,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +12: [2023-05-13 01:00:14,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +12: [2023-05-13 01:00:14,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +12: [2023-05-13 01:00:14,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +27: [2023-05-13 01:00:14,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +22: [2023-05-13 01:00:14,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +22: [2023-05-13 01:00:14,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +19: [2023-05-13 01:00:14,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:14,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +17: [2023-05-13 01:00:14,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +17: [2023-05-13 01:00:14,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +17: [2023-05-13 01:00:14,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +17: [2023-05-13 01:00:14,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +23: [2023-05-13 01:00:14,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +23: [2023-05-13 01:00:14,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +17: [2023-05-13 01:00:14,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +17: [2023-05-13 01:00:14,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +29: [2023-05-13 01:00:14,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +15: [2023-05-13 01:00:14,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +17: [2023-05-13 01:00:14,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +29: [2023-05-13 01:00:14,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +22: [2023-05-13 01:00:14,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +17: [2023-05-13 01:00:14,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:14,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +21: [2023-05-13 01:00:14,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:14,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +23: [2023-05-13 01:00:14,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +23: [2023-05-13 01:00:14,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 6: [2023-05-13 01:00:14,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +23: [2023-05-13 01:00:14,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 2: [2023-05-13 01:00:14,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +23: [2023-05-13 01:00:14,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +23: [2023-05-13 01:00:14,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +23: [2023-05-13 01:00:14,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +23: [2023-05-13 01:00:14,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +29: [2023-05-13 01:00:14,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +19: [2023-05-13 01:00:14,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +19: [2023-05-13 01:00:14,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +15: [2023-05-13 01:00:14,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +17: [2023-05-13 01:00:14,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +12: [2023-05-13 01:00:14,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +12: [2023-05-13 01:00:14,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +12: [2023-05-13 01:00:14,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:14,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +21: [2023-05-13 01:00:14,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:14,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +23: [2023-05-13 01:00:14,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +23: [2023-05-13 01:00:14,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +21: [2023-05-13 01:00:14,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +17: [2023-05-13 01:00:14,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 4: [2023-05-13 01:00:14,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +23: [2023-05-13 01:00:14,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 2: [2023-05-13 01:00:14,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +21: [2023-05-13 01:00:14,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +23: [2023-05-13 01:00:14,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +29: [2023-05-13 01:00:14,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +23: [2023-05-13 01:00:14,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +23: [2023-05-13 01:00:14,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +29: [2023-05-13 01:00:14,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +23: [2023-05-13 01:00:14,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +11: [2023-05-13 01:00:14,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +15: [2023-05-13 01:00:14,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 6: [2023-05-13 01:00:14,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +22: [2023-05-13 01:00:14,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +15: [2023-05-13 01:00:14,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +21: [2023-05-13 01:00:14,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +21: [2023-05-13 01:00:14,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +22: [2023-05-13 01:00:14,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +15: [2023-05-13 01:00:14,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +21: [2023-05-13 01:00:14,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +11: [2023-05-13 01:00:14,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +15: [2023-05-13 01:00:14,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +19: [2023-05-13 01:00:14,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +22: [2023-05-13 01:00:14,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +29: [2023-05-13 01:00:14,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:14,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +15: [2023-05-13 01:00:14,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +19: [2023-05-13 01:00:14,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +25: [2023-05-13 01:00:14,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +25: [2023-05-13 01:00:14,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +25: [2023-05-13 01:00:14,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +23: [2023-05-13 01:00:14,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +19: [2023-05-13 01:00:14,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +19: [2023-05-13 01:00:14,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:14,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +25: [2023-05-13 01:00:14,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +25: [2023-05-13 01:00:14,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +25: [2023-05-13 01:00:14,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +25: [2023-05-13 01:00:14,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +25: [2023-05-13 01:00:14,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +25: [2023-05-13 01:00:14,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +15: [2023-05-13 01:00:14,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:14,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +25: [2023-05-13 01:00:14,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:14,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +19: [2023-05-13 01:00:14,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 4: [2023-05-13 01:00:14,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:14,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +25: [2023-05-13 01:00:14,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +25: [2023-05-13 01:00:14,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +13: [2023-05-13 01:00:14,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +19: [2023-05-13 01:00:14,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +12: [2023-05-13 01:00:14,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +19: [2023-05-13 01:00:14,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +26: [2023-05-13 01:00:14,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +26: [2023-05-13 01:00:14,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +26: [2023-05-13 01:00:14,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +10: [2023-05-13 01:00:14,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +13: [2023-05-13 01:00:14,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +10: [2023-05-13 01:00:14,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +10: [2023-05-13 01:00:14,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +10: [2023-05-13 01:00:14,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +10: [2023-05-13 01:00:14,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +10: [2023-05-13 01:00:14,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +10: [2023-05-13 01:00:14,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +10: [2023-05-13 01:00:14,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +10: [2023-05-13 01:00:14,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +10: [2023-05-13 01:00:14,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +10: [2023-05-13 01:00:14,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +10: [2023-05-13 01:00:14,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +10: [2023-05-13 01:00:14,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +10: [2023-05-13 01:00:14,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +10: [2023-05-13 01:00:14,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +10: [2023-05-13 01:00:14,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:14,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +23: [2023-05-13 01:00:14,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +17: [2023-05-13 01:00:14,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +13: [2023-05-13 01:00:14,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +13: [2023-05-13 01:00:14,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +19: [2023-05-13 01:00:14,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:14,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +19: [2023-05-13 01:00:14,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +13: [2023-05-13 01:00:14,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +17: [2023-05-13 01:00:14,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +23: [2023-05-13 01:00:14,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +13: [2023-05-13 01:00:14,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:14,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +12: [2023-05-13 01:00:14,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +17: [2023-05-13 01:00:14,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +12: [2023-05-13 01:00:14,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +12: [2023-05-13 01:00:14,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +19: [2023-05-13 01:00:14,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +17: [2023-05-13 01:00:14,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +23: [2023-05-13 01:00:14,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +23: [2023-05-13 01:00:14,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +13: [2023-05-13 01:00:14,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +17: [2023-05-13 01:00:14,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:14,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +19: [2023-05-13 01:00:14,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:14,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +13: [2023-05-13 01:00:14,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:14,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +23: [2023-05-13 01:00:14,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:14,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:14,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:14,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:14,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +12: [2023-05-13 01:00:14,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +12: [2023-05-13 01:00:14,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +12: [2023-05-13 01:00:14,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 0: [2023-05-13 01:00:14,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +17: [2023-05-13 01:00:14,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +17: [2023-05-13 01:00:14,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +17: [2023-05-13 01:00:14,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +17: [2023-05-13 01:00:14,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +25: [2023-05-13 01:00:14,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +25: [2023-05-13 01:00:14,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +23: [2023-05-13 01:00:14,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:14,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +12: [2023-05-13 01:00:14,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +23: [2023-05-13 01:00:14,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +23: [2023-05-13 01:00:14,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +23: [2023-05-13 01:00:14,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +17: [2023-05-13 01:00:14,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +17: [2023-05-13 01:00:14,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +26: [2023-05-13 01:00:14,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +26: [2023-05-13 01:00:14,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +26: [2023-05-13 01:00:14,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +26: [2023-05-13 01:00:14,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +26: [2023-05-13 01:00:14,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +26: [2023-05-13 01:00:14,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +26: [2023-05-13 01:00:14,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +26: [2023-05-13 01:00:14,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +26: [2023-05-13 01:00:14,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +26: [2023-05-13 01:00:14,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +26: [2023-05-13 01:00:14,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +26: [2023-05-13 01:00:14,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +26: [2023-05-13 01:00:14,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +26: [2023-05-13 01:00:14,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +12: [2023-05-13 01:00:14,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +23: [2023-05-13 01:00:14,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:14,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:14,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:14,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +28: [2023-05-13 01:00:14,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +28: [2023-05-13 01:00:14,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +28: [2023-05-13 01:00:14,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +28: [2023-05-13 01:00:14,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +28: [2023-05-13 01:00:14,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +28: [2023-05-13 01:00:14,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +28: [2023-05-13 01:00:14,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +28: [2023-05-13 01:00:14,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 5: [2023-05-13 01:00:14,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 9: [2023-05-13 01:00:14,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 5: [2023-05-13 01:00:14,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 9: [2023-05-13 01:00:14,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +31: [2023-05-13 01:00:14,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +31: [2023-05-13 01:00:14,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +31: [2023-05-13 01:00:14,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +31: [2023-05-13 01:00:14,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +28: [2023-05-13 01:00:14,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +31: [2023-05-13 01:00:14,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +31: [2023-05-13 01:00:14,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +31: [2023-05-13 01:00:14,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +28: [2023-05-13 01:00:14,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +31: [2023-05-13 01:00:14,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +28: [2023-05-13 01:00:14,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +28: [2023-05-13 01:00:14,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +28: [2023-05-13 01:00:14,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +28: [2023-05-13 01:00:14,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +28: [2023-05-13 01:00:14,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +28: [2023-05-13 01:00:14,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +31: [2023-05-13 01:00:14,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +23: [2023-05-13 01:00:14,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +31: [2023-05-13 01:00:14,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +31: [2023-05-13 01:00:14,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +31: [2023-05-13 01:00:14,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +31: [2023-05-13 01:00:14,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +31: [2023-05-13 01:00:14,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +31: [2023-05-13 01:00:14,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +31: [2023-05-13 01:00:14,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:14,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:14,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +23: [2023-05-13 01:00:14,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:14,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:14,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +20: [2023-05-13 01:00:14,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +20: [2023-05-13 01:00:14,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +23: [2023-05-13 01:00:14,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:14,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +20: [2023-05-13 01:00:14,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +20: [2023-05-13 01:00:14,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +20: [2023-05-13 01:00:14,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +20: [2023-05-13 01:00:14,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +25: [2023-05-13 01:00:14,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +20: [2023-05-13 01:00:14,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +17: [2023-05-13 01:00:14,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +20: [2023-05-13 01:00:14,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +20: [2023-05-13 01:00:14,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +17: [2023-05-13 01:00:14,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +17: [2023-05-13 01:00:14,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:14,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:14,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +23: [2023-05-13 01:00:14,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:14,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +25: [2023-05-13 01:00:14,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +25: [2023-05-13 01:00:14,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +20: [2023-05-13 01:00:14,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +20: [2023-05-13 01:00:14,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +20: [2023-05-13 01:00:14,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +20: [2023-05-13 01:00:14,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +20: [2023-05-13 01:00:14,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +20: [2023-05-13 01:00:14,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +20: [2023-05-13 01:00:14,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 0: [2023-05-13 01:00:14,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +23: [2023-05-13 01:00:14,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:14,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +26: [2023-05-13 01:00:14,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +26: [2023-05-13 01:00:14,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +26: [2023-05-13 01:00:14,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +26: [2023-05-13 01:00:14,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +26: [2023-05-13 01:00:14,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +26: [2023-05-13 01:00:14,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +25: [2023-05-13 01:00:14,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +26: [2023-05-13 01:00:14,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +26: [2023-05-13 01:00:14,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +26: [2023-05-13 01:00:14,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +26: [2023-05-13 01:00:14,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +26: [2023-05-13 01:00:14,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +25: [2023-05-13 01:00:14,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +26: [2023-05-13 01:00:14,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +28: [2023-05-13 01:00:14,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +26: [2023-05-13 01:00:14,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +26: [2023-05-13 01:00:14,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +28: [2023-05-13 01:00:14,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +28: [2023-05-13 01:00:14,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +28: [2023-05-13 01:00:14,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +28: [2023-05-13 01:00:14,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +20: [2023-05-13 01:00:14,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +31: [2023-05-13 01:00:14,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +31: [2023-05-13 01:00:14,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +28: [2023-05-13 01:00:14,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +31: [2023-05-13 01:00:14,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +31: [2023-05-13 01:00:14,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +26: [2023-05-13 01:00:14,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +31: [2023-05-13 01:00:14,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +31: [2023-05-13 01:00:14,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +16: [2023-05-13 01:00:14,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +18: [2023-05-13 01:00:14,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +18: [2023-05-13 01:00:14,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +31: [2023-05-13 01:00:14,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +16: [2023-05-13 01:00:14,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +16: [2023-05-13 01:00:14,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +16: [2023-05-13 01:00:14,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +16: [2023-05-13 01:00:14,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +16: [2023-05-13 01:00:14,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +16: [2023-05-13 01:00:14,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +16: [2023-05-13 01:00:14,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +18: [2023-05-13 01:00:14,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +28: [2023-05-13 01:00:14,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +28: [2023-05-13 01:00:14,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +16: [2023-05-13 01:00:14,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +16: [2023-05-13 01:00:14,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +16: [2023-05-13 01:00:14,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +31: [2023-05-13 01:00:14,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +16: [2023-05-13 01:00:14,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +16: [2023-05-13 01:00:14,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +16: [2023-05-13 01:00:14,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +16: [2023-05-13 01:00:14,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +16: [2023-05-13 01:00:14,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +28: [2023-05-13 01:00:14,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +20: [2023-05-13 01:00:14,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +31: [2023-05-13 01:00:14,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +31: [2023-05-13 01:00:14,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +31: [2023-05-13 01:00:14,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +31: [2023-05-13 01:00:14,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +28: [2023-05-13 01:00:14,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +28: [2023-05-13 01:00:14,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +28: [2023-05-13 01:00:14,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +28: [2023-05-13 01:00:14,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +28: [2023-05-13 01:00:14,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +31: [2023-05-13 01:00:14,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +30: [2023-05-13 01:00:14,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +24: [2023-05-13 01:00:14,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +30: [2023-05-13 01:00:14,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +31: [2023-05-13 01:00:14,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +30: [2023-05-13 01:00:14,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +30: [2023-05-13 01:00:14,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +30: [2023-05-13 01:00:14,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +30: [2023-05-13 01:00:14,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +30: [2023-05-13 01:00:14,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +24: [2023-05-13 01:00:14,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +30: [2023-05-13 01:00:14,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +31: [2023-05-13 01:00:14,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:14,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +24: [2023-05-13 01:00:14,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +24: [2023-05-13 01:00:14,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +24: [2023-05-13 01:00:14,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +31: [2023-05-13 01:00:14,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:14,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +24: [2023-05-13 01:00:14,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +30: [2023-05-13 01:00:14,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +24: [2023-05-13 01:00:14,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +24: [2023-05-13 01:00:14,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +28: [2023-05-13 01:00:14,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +30: [2023-05-13 01:00:14,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +20: [2023-05-13 01:00:14,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +20: [2023-05-13 01:00:14,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +20: [2023-05-13 01:00:14,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +28: [2023-05-13 01:00:14,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:14,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +24: [2023-05-13 01:00:14,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +20: [2023-05-13 01:00:14,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +20: [2023-05-13 01:00:14,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +20: [2023-05-13 01:00:14,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +20: [2023-05-13 01:00:14,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +30: [2023-05-13 01:00:14,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +30: [2023-05-13 01:00:14,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +24: [2023-05-13 01:00:14,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +24: [2023-05-13 01:00:14,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +24: [2023-05-13 01:00:14,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +30: [2023-05-13 01:00:14,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +24: [2023-05-13 01:00:14,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +30: [2023-05-13 01:00:14,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +30: [2023-05-13 01:00:14,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +30: [2023-05-13 01:00:14,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt... +16: [2023-05-13 01:00:14,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:14,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 1: [2023-05-13 01:00:14,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +20: [2023-05-13 01:00:14,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +18: [2023-05-13 01:00:14,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +20: [2023-05-13 01:00:14,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +16: [2023-05-13 01:00:14,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +24: [2023-05-13 01:00:14,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +20: [2023-05-13 01:00:14,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +20: [2023-05-13 01:00:14,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +20: [2023-05-13 01:00:14,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +16: [2023-05-13 01:00:14,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +18: [2023-05-13 01:00:14,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +16: [2023-05-13 01:00:14,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +20: [2023-05-13 01:00:14,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +20: [2023-05-13 01:00:14,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +18: [2023-05-13 01:00:14,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 3: [2023-05-13 01:00:14,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +30: [2023-05-13 01:00:14,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +30: [2023-05-13 01:00:14,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:14,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:14,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +16: [2023-05-13 01:00:14,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +16: [2023-05-13 01:00:14,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +16: [2023-05-13 01:00:14,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +18: [2023-05-13 01:00:14,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +18: [2023-05-13 01:00:14,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +18: [2023-05-13 01:00:14,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +16: [2023-05-13 01:00:14,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +16: [2023-05-13 01:00:14,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +30: [2023-05-13 01:00:14,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +16: [2023-05-13 01:00:14,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:14,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +24: [2023-05-13 01:00:14,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +18: [2023-05-13 01:00:14,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +18: [2023-05-13 01:00:14,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +30: [2023-05-13 01:00:14,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +30: [2023-05-13 01:00:14,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +30: [2023-05-13 01:00:14,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 3: [2023-05-13 01:00:14,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:14,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:14,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +30: [2023-05-13 01:00:14,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +30: [2023-05-13 01:00:14,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. + 8: [2023-05-13 01:00:14,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +30: [2023-05-13 01:00:14,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +30: [2023-05-13 01:00:14,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +24: [2023-05-13 01:00:14,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +24: [2023-05-13 01:00:14,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +30: [2023-05-13 01:00:14,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +16: [2023-05-13 01:00:14,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +24: [2023-05-13 01:00:14,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +16: [2023-05-13 01:00:14,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +16: [2023-05-13 01:00:14,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +16: [2023-05-13 01:00:14,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:14,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +30: [2023-05-13 01:00:14,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:14,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_28-model_00-model_states.pt. +16: [2023-05-13 01:00:14,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +30: [2023-05-13 01:00:14,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:14,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +30: [2023-05-13 01:00:14,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:14,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +30: [2023-05-13 01:00:14,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +16: [2023-05-13 01:00:14,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +30: [2023-05-13 01:00:14,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:14,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:14,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:14,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 7: [2023-05-13 01:00:14,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:14,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +11: [2023-05-13 01:00:15,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +11: [2023-05-13 01:00:15,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +11: [2023-05-13 01:00:15,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +11: [2023-05-13 01:00:15,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +11: [2023-05-13 01:00:15,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +11: [2023-05-13 01:00:15,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +11: [2023-05-13 01:00:15,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +11: [2023-05-13 01:00:15,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +11: [2023-05-13 01:00:15,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +11: [2023-05-13 01:00:15,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +11: [2023-05-13 01:00:15,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +11: [2023-05-13 01:00:15,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +11: [2023-05-13 01:00:15,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +11: [2023-05-13 01:00:15,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +11: [2023-05-13 01:00:15,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +11: [2023-05-13 01:00:15,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +10: [2023-05-13 01:00:15,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +10: [2023-05-13 01:00:15,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +10: [2023-05-13 01:00:15,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +10: [2023-05-13 01:00:15,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +10: [2023-05-13 01:00:15,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +10: [2023-05-13 01:00:15,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +10: [2023-05-13 01:00:15,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +10: [2023-05-13 01:00:15,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +10: [2023-05-13 01:00:15,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +10: [2023-05-13 01:00:15,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +10: [2023-05-13 01:00:15,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +10: [2023-05-13 01:00:15,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +10: [2023-05-13 01:00:15,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +10: [2023-05-13 01:00:15,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +10: [2023-05-13 01:00:15,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +10: [2023-05-13 01:00:15,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +29: [2023-05-13 01:00:15,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +29: [2023-05-13 01:00:15,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +29: [2023-05-13 01:00:15,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +29: [2023-05-13 01:00:15,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +29: [2023-05-13 01:00:15,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +29: [2023-05-13 01:00:15,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +29: [2023-05-13 01:00:15,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +29: [2023-05-13 01:00:15,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +29: [2023-05-13 01:00:15,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +29: [2023-05-13 01:00:15,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +29: [2023-05-13 01:00:15,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +29: [2023-05-13 01:00:15,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +29: [2023-05-13 01:00:15,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +29: [2023-05-13 01:00:15,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +29: [2023-05-13 01:00:15,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +29: [2023-05-13 01:00:15,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +27: [2023-05-13 01:00:15,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +27: [2023-05-13 01:00:15,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +27: [2023-05-13 01:00:15,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +27: [2023-05-13 01:00:15,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +27: [2023-05-13 01:00:15,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +27: [2023-05-13 01:00:15,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +27: [2023-05-13 01:00:15,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +27: [2023-05-13 01:00:15,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +27: [2023-05-13 01:00:15,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +27: [2023-05-13 01:00:15,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +27: [2023-05-13 01:00:15,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +27: [2023-05-13 01:00:15,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +27: [2023-05-13 01:00:15,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +27: [2023-05-13 01:00:15,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +27: [2023-05-13 01:00:15,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +27: [2023-05-13 01:00:15,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +14: [2023-05-13 01:00:15,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +14: [2023-05-13 01:00:15,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +14: [2023-05-13 01:00:15,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +14: [2023-05-13 01:00:15,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +14: [2023-05-13 01:00:15,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +14: [2023-05-13 01:00:15,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +14: [2023-05-13 01:00:15,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +14: [2023-05-13 01:00:15,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +11: [2023-05-13 01:00:15,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +14: [2023-05-13 01:00:15,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +14: [2023-05-13 01:00:15,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +14: [2023-05-13 01:00:15,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +14: [2023-05-13 01:00:15,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +17: [2023-05-13 01:00:15,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +14: [2023-05-13 01:00:15,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +14: [2023-05-13 01:00:15,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +17: [2023-05-13 01:00:15,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +10: [2023-05-13 01:00:15,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +14: [2023-05-13 01:00:15,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +14: [2023-05-13 01:00:15,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +11: [2023-05-13 01:00:15,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +11: [2023-05-13 01:00:15,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +11: [2023-05-13 01:00:15,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +28: [2023-05-13 01:00:15,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +28: [2023-05-13 01:00:15,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +28: [2023-05-13 01:00:15,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +28: [2023-05-13 01:00:15,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +28: [2023-05-13 01:00:15,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +28: [2023-05-13 01:00:15,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +28: [2023-05-13 01:00:15,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +28: [2023-05-13 01:00:15,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +26: [2023-05-13 01:00:15,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +26: [2023-05-13 01:00:15,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +17: [2023-05-13 01:00:15,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +19: [2023-05-13 01:00:15,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +19: [2023-05-13 01:00:15,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +19: [2023-05-13 01:00:15,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +19: [2023-05-13 01:00:15,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +19: [2023-05-13 01:00:15,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +19: [2023-05-13 01:00:15,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +19: [2023-05-13 01:00:15,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +10: [2023-05-13 01:00:15,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +19: [2023-05-13 01:00:15,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +10: [2023-05-13 01:00:15,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +17: [2023-05-13 01:00:15,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +26: [2023-05-13 01:00:15,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +26: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +19: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +26: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +28: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +28: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +28: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +28: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:15,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +25: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +25: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +26: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +28: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +28: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +26: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +26: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +26: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +25: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +25: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +25: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +25: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +28: [2023-05-13 01:00:15,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:15,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +28: [2023-05-13 01:00:15,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +17: [2023-05-13 01:00:15,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +19: [2023-05-13 01:00:15,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +26: [2023-05-13 01:00:15,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:15,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:15,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +26: [2023-05-13 01:00:15,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:15,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:15,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +26: [2023-05-13 01:00:15,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:15,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +26: [2023-05-13 01:00:15,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:15,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +19: [2023-05-13 01:00:15,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +19: [2023-05-13 01:00:15,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +11: [2023-05-13 01:00:15,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +26: [2023-05-13 01:00:15,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +19: [2023-05-13 01:00:15,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +26: [2023-05-13 01:00:15,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +19: [2023-05-13 01:00:15,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +19: [2023-05-13 01:00:15,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +21: [2023-05-13 01:00:15,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +21: [2023-05-13 01:00:15,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +19: [2023-05-13 01:00:15,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +26: [2023-05-13 01:00:15,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +21: [2023-05-13 01:00:15,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +25: [2023-05-13 01:00:15,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +21: [2023-05-13 01:00:15,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +21: [2023-05-13 01:00:15,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +21: [2023-05-13 01:00:15,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +13: [2023-05-13 01:00:15,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +13: [2023-05-13 01:00:15,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +21: [2023-05-13 01:00:15,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +13: [2023-05-13 01:00:15,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +25: [2023-05-13 01:00:15,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:15,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +13: [2023-05-13 01:00:15,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +13: [2023-05-13 01:00:15,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +13: [2023-05-13 01:00:15,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:15,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +21: [2023-05-13 01:00:15,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +21: [2023-05-13 01:00:15,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:15,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +21: [2023-05-13 01:00:15,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:15,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:15,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:15,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +21: [2023-05-13 01:00:15,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +21: [2023-05-13 01:00:15,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +11: [2023-05-13 01:00:15,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +21: [2023-05-13 01:00:15,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +21: [2023-05-13 01:00:15,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +21: [2023-05-13 01:00:15,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +10: [2023-05-13 01:00:15,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +10: [2023-05-13 01:00:15,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +10: [2023-05-13 01:00:15,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +13: [2023-05-13 01:00:15,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:15,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:15,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:15,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +10: [2023-05-13 01:00:15,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +10: [2023-05-13 01:00:15,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +10: [2023-05-13 01:00:15,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +29: [2023-05-13 01:00:15,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +29: [2023-05-13 01:00:15,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +11: [2023-05-13 01:00:15,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +11: [2023-05-13 01:00:15,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +11: [2023-05-13 01:00:15,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +11: [2023-05-13 01:00:15,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +10: [2023-05-13 01:00:15,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +29: [2023-05-13 01:00:15,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +10: [2023-05-13 01:00:15,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +29: [2023-05-13 01:00:15,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +18: [2023-05-13 01:00:15,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +18: [2023-05-13 01:00:15,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +11: [2023-05-13 01:00:15,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +11: [2023-05-13 01:00:15,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +29: [2023-05-13 01:00:15,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +29: [2023-05-13 01:00:15,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +29: [2023-05-13 01:00:15,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +29: [2023-05-13 01:00:15,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +18: [2023-05-13 01:00:15,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +18: [2023-05-13 01:00:15,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +18: [2023-05-13 01:00:15,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +18: [2023-05-13 01:00:15,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +18: [2023-05-13 01:00:15,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +18: [2023-05-13 01:00:15,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +27: [2023-05-13 01:00:15,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +18: [2023-05-13 01:00:15,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +18: [2023-05-13 01:00:15,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +18: [2023-05-13 01:00:15,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +18: [2023-05-13 01:00:15,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +14: [2023-05-13 01:00:15,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +11: [2023-05-13 01:00:15,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +18: [2023-05-13 01:00:15,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +18: [2023-05-13 01:00:15,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +26: [2023-05-13 01:00:15,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +27: [2023-05-13 01:00:15,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +10: [2023-05-13 01:00:15,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +10: [2023-05-13 01:00:15,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +11: [2023-05-13 01:00:15,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +27: [2023-05-13 01:00:15,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +27: [2023-05-13 01:00:15,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +27: [2023-05-13 01:00:15,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +10: [2023-05-13 01:00:15,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +10: [2023-05-13 01:00:15,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +19: [2023-05-13 01:00:15,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +27: [2023-05-13 01:00:15,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +27: [2023-05-13 01:00:15,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +27: [2023-05-13 01:00:15,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +14: [2023-05-13 01:00:15,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +10: [2023-05-13 01:00:15,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +29: [2023-05-13 01:00:15,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +25: [2023-05-13 01:00:15,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +25: [2023-05-13 01:00:15,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +11: [2023-05-13 01:00:15,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +11: [2023-05-13 01:00:15,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +14: [2023-05-13 01:00:15,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +29: [2023-05-13 01:00:15,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +28: [2023-05-13 01:00:15,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +29: [2023-05-13 01:00:15,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +29: [2023-05-13 01:00:15,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +27: [2023-05-13 01:00:15,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +14: [2023-05-13 01:00:15,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +14: [2023-05-13 01:00:15,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +14: [2023-05-13 01:00:15,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +29: [2023-05-13 01:00:15,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +29: [2023-05-13 01:00:15,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +26: [2023-05-13 01:00:15,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +28: [2023-05-13 01:00:15,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +28: [2023-05-13 01:00:15,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +26: [2023-05-13 01:00:15,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +14: [2023-05-13 01:00:15,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +28: [2023-05-13 01:00:15,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +28: [2023-05-13 01:00:15,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +14: [2023-05-13 01:00:15,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +25: [2023-05-13 01:00:15,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +25: [2023-05-13 01:00:15,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +19: [2023-05-13 01:00:15,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +26: [2023-05-13 01:00:15,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +29: [2023-05-13 01:00:15,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +13: [2023-05-13 01:00:15,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +29: [2023-05-13 01:00:15,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +13: [2023-05-13 01:00:15,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +14: [2023-05-13 01:00:15,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +21: [2023-05-13 01:00:15,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +21: [2023-05-13 01:00:15,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +14: [2023-05-13 01:00:15,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +19: [2023-05-13 01:00:15,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +21: [2023-05-13 01:00:15,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +13: [2023-05-13 01:00:15,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +13: [2023-05-13 01:00:15,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +27: [2023-05-13 01:00:15,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +28: [2023-05-13 01:00:15,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +28: [2023-05-13 01:00:15,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +27: [2023-05-13 01:00:15,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +26: [2023-05-13 01:00:15,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +27: [2023-05-13 01:00:15,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +17: [2023-05-13 01:00:15,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +27: [2023-05-13 01:00:15,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +27: [2023-05-13 01:00:15,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +25: [2023-05-13 01:00:15,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +21: [2023-05-13 01:00:15,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +27: [2023-05-13 01:00:15,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +25: [2023-05-13 01:00:15,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +25: [2023-05-13 01:00:15,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +26: [2023-05-13 01:00:15,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +28: [2023-05-13 01:00:15,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +21: [2023-05-13 01:00:15,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +27: [2023-05-13 01:00:15,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +25: [2023-05-13 01:00:15,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +14: [2023-05-13 01:00:15,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +14: [2023-05-13 01:00:15,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +13: [2023-05-13 01:00:15,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +13: [2023-05-13 01:00:15,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +16: [2023-05-13 01:00:15,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +16: [2023-05-13 01:00:15,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +16: [2023-05-13 01:00:15,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +16: [2023-05-13 01:00:15,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +16: [2023-05-13 01:00:15,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +16: [2023-05-13 01:00:15,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +16: [2023-05-13 01:00:15,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +16: [2023-05-13 01:00:15,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +14: [2023-05-13 01:00:15,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +26: [2023-05-13 01:00:15,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +14: [2023-05-13 01:00:15,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +28: [2023-05-13 01:00:15,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +28: [2023-05-13 01:00:15,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +16: [2023-05-13 01:00:15,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +28: [2023-05-13 01:00:15,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +16: [2023-05-13 01:00:15,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +26: [2023-05-13 01:00:15,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +14: [2023-05-13 01:00:15,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +19: [2023-05-13 01:00:15,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +13: [2023-05-13 01:00:15,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +16: [2023-05-13 01:00:15,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +25: [2023-05-13 01:00:15,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +13: [2023-05-13 01:00:15,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +25: [2023-05-13 01:00:15,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +13: [2023-05-13 01:00:15,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +18: [2023-05-13 01:00:15,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +28: [2023-05-13 01:00:15,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +28: [2023-05-13 01:00:15,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +18: [2023-05-13 01:00:15,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +21: [2023-05-13 01:00:15,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +19: [2023-05-13 01:00:15,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +19: [2023-05-13 01:00:15,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +16: [2023-05-13 01:00:15,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +16: [2023-05-13 01:00:15,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +16: [2023-05-13 01:00:15,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:15,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +14: [2023-05-13 01:00:15,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +16: [2023-05-13 01:00:15,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +17: [2023-05-13 01:00:15,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +19: [2023-05-13 01:00:15,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +19: [2023-05-13 01:00:15,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +19: [2023-05-13 01:00:15,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +16: [2023-05-13 01:00:15,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:15,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +26: [2023-05-13 01:00:15,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +13: [2023-05-13 01:00:15,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +26: [2023-05-13 01:00:15,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +28: [2023-05-13 01:00:15,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +28: [2023-05-13 01:00:15,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +25: [2023-05-13 01:00:15,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +28: [2023-05-13 01:00:15,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +26: [2023-05-13 01:00:15,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +25: [2023-05-13 01:00:15,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +25: [2023-05-13 01:00:15,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +25: [2023-05-13 01:00:15,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +17: [2023-05-13 01:00:15,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +18: [2023-05-13 01:00:15,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +17: [2023-05-13 01:00:15,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +13: [2023-05-13 01:00:15,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +13: [2023-05-13 01:00:15,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +26: [2023-05-13 01:00:15,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +26: [2023-05-13 01:00:15,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +17: [2023-05-13 01:00:15,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +13: [2023-05-13 01:00:15,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +18: [2023-05-13 01:00:15,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +13: [2023-05-13 01:00:15,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +17: [2023-05-13 01:00:15,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +21: [2023-05-13 01:00:15,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +18: [2023-05-13 01:00:15,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +18: [2023-05-13 01:00:15,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +18: [2023-05-13 01:00:15,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +26: [2023-05-13 01:00:15,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +26: [2023-05-13 01:00:15,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +25: [2023-05-13 01:00:15,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +25: [2023-05-13 01:00:15,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +16: [2023-05-13 01:00:15,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +26: [2023-05-13 01:00:15,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +17: [2023-05-13 01:00:15,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +19: [2023-05-13 01:00:15,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +19: [2023-05-13 01:00:15,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +19: [2023-05-13 01:00:15,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +19: [2023-05-13 01:00:15,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +19: [2023-05-13 01:00:15,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +19: [2023-05-13 01:00:15,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +19: [2023-05-13 01:00:15,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +23: [2023-05-13 01:00:15,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +23: [2023-05-13 01:00:15,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +23: [2023-05-13 01:00:15,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +23: [2023-05-13 01:00:15,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +23: [2023-05-13 01:00:15,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +23: [2023-05-13 01:00:15,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +23: [2023-05-13 01:00:15,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +18: [2023-05-13 01:00:15,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +23: [2023-05-13 01:00:15,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +23: [2023-05-13 01:00:15,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +23: [2023-05-13 01:00:15,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +15: [2023-05-13 01:00:15,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +15: [2023-05-13 01:00:15,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +15: [2023-05-13 01:00:15,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +16: [2023-05-13 01:00:15,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +15: [2023-05-13 01:00:15,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +23: [2023-05-13 01:00:15,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +23: [2023-05-13 01:00:15,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +16: [2023-05-13 01:00:15,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +23: [2023-05-13 01:00:15,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +15: [2023-05-13 01:00:15,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +15: [2023-05-13 01:00:15,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +15: [2023-05-13 01:00:15,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +23: [2023-05-13 01:00:15,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +23: [2023-05-13 01:00:15,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +16: [2023-05-13 01:00:15,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +23: [2023-05-13 01:00:15,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +22: [2023-05-13 01:00:15,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +22: [2023-05-13 01:00:15,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +22: [2023-05-13 01:00:15,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +22: [2023-05-13 01:00:15,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +22: [2023-05-13 01:00:15,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +22: [2023-05-13 01:00:15,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +22: [2023-05-13 01:00:15,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +22: [2023-05-13 01:00:15,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +30: [2023-05-13 01:00:15,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +22: [2023-05-13 01:00:15,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +30: [2023-05-13 01:00:15,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +30: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +30: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +30: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +30: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +30: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +30: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +30: [2023-05-13 01:00:15,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +20: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +20: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +20: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +20: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +20: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +20: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +20: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +12: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +12: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +20: [2023-05-13 01:00:15,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +22: [2023-05-13 01:00:15,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:15,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +12: [2023-05-13 01:00:15,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +12: [2023-05-13 01:00:15,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +12: [2023-05-13 01:00:15,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +22: [2023-05-13 01:00:15,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:15,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +31: [2023-05-13 01:00:15,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +31: [2023-05-13 01:00:15,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +31: [2023-05-13 01:00:15,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +31: [2023-05-13 01:00:15,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +31: [2023-05-13 01:00:15,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +22: [2023-05-13 01:00:15,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +31: [2023-05-13 01:00:15,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +31: [2023-05-13 01:00:15,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +31: [2023-05-13 01:00:15,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +30: [2023-05-13 01:00:15,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +22: [2023-05-13 01:00:15,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +22: [2023-05-13 01:00:15,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +22: [2023-05-13 01:00:15,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:15,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +24: [2023-05-13 01:00:15,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +30: [2023-05-13 01:00:15,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:15,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +20: [2023-05-13 01:00:15,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +24: [2023-05-13 01:00:15,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +24: [2023-05-13 01:00:15,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +24: [2023-05-13 01:00:15,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +24: [2023-05-13 01:00:15,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +24: [2023-05-13 01:00:15,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:15,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +20: [2023-05-13 01:00:15,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +30: [2023-05-13 01:00:15,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:15,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:15,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +22: [2023-05-13 01:00:15,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:15,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +31: [2023-05-13 01:00:15,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +31: [2023-05-13 01:00:15,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +31: [2023-05-13 01:00:15,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +31: [2023-05-13 01:00:15,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:15,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +31: [2023-05-13 01:00:15,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +31: [2023-05-13 01:00:15,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +31: [2023-05-13 01:00:15,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +31: [2023-05-13 01:00:15,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +12: [2023-05-13 01:00:15,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +20: [2023-05-13 01:00:15,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +30: [2023-05-13 01:00:15,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +30: [2023-05-13 01:00:15,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +30: [2023-05-13 01:00:15,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +30: [2023-05-13 01:00:15,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +20: [2023-05-13 01:00:15,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:15,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +12: [2023-05-13 01:00:15,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +16: [2023-05-13 01:00:15,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +20: [2023-05-13 01:00:15,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:15,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +12: [2023-05-13 01:00:15,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:15,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +16: [2023-05-13 01:00:15,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +20: [2023-05-13 01:00:15,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +12: [2023-05-13 01:00:15,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +16: [2023-05-13 01:00:15,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +16: [2023-05-13 01:00:15,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +16: [2023-05-13 01:00:15,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +24: [2023-05-13 01:00:15,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:15,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +20: [2023-05-13 01:00:15,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:15,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +24: [2023-05-13 01:00:15,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +20: [2023-05-13 01:00:15,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... +16: [2023-05-13 01:00:15,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +16: [2023-05-13 01:00:15,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +23: [2023-05-13 01:00:15,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +22: [2023-05-13 01:00:15,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +23: [2023-05-13 01:00:15,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +16: [2023-05-13 01:00:15,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +15: [2023-05-13 01:00:15,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +16: [2023-05-13 01:00:15,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +16: [2023-05-13 01:00:15,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +16: [2023-05-13 01:00:15,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +30: [2023-05-13 01:00:15,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +23: [2023-05-13 01:00:15,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +31: [2023-05-13 01:00:15,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +20: [2023-05-13 01:00:15,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +30: [2023-05-13 01:00:15,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +16: [2023-05-13 01:00:15,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +23: [2023-05-13 01:00:15,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +23: [2023-05-13 01:00:15,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +23: [2023-05-13 01:00:15,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +24: [2023-05-13 01:00:15,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +24: [2023-05-13 01:00:15,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +22: [2023-05-13 01:00:15,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +22: [2023-05-13 01:00:15,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +23: [2023-05-13 01:00:15,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +12: [2023-05-13 01:00:15,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +22: [2023-05-13 01:00:15,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +31: [2023-05-13 01:00:15,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +31: [2023-05-13 01:00:15,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +31: [2023-05-13 01:00:15,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +31: [2023-05-13 01:00:15,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +22: [2023-05-13 01:00:15,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +30: [2023-05-13 01:00:15,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +31: [2023-05-13 01:00:15,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +22: [2023-05-13 01:00:15,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +22: [2023-05-13 01:00:15,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +31: [2023-05-13 01:00:15,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +20: [2023-05-13 01:00:15,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +20: [2023-05-13 01:00:15,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +30: [2023-05-13 01:00:15,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +30: [2023-05-13 01:00:15,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +30: [2023-05-13 01:00:15,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +22: [2023-05-13 01:00:15,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +15: [2023-05-13 01:00:15,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +30: [2023-05-13 01:00:15,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +12: [2023-05-13 01:00:15,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +12: [2023-05-13 01:00:15,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +12: [2023-05-13 01:00:15,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +24: [2023-05-13 01:00:15,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +31: [2023-05-13 01:00:15,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +30: [2023-05-13 01:00:15,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +30: [2023-05-13 01:00:15,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +23: [2023-05-13 01:00:15,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +31: [2023-05-13 01:00:15,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +24: [2023-05-13 01:00:15,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +24: [2023-05-13 01:00:15,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +24: [2023-05-13 01:00:15,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +12: [2023-05-13 01:00:15,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +23: [2023-05-13 01:00:15,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +23: [2023-05-13 01:00:15,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +23: [2023-05-13 01:00:15,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +22: [2023-05-13 01:00:15,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +30: [2023-05-13 01:00:15,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +23: [2023-05-13 01:00:15,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +24: [2023-05-13 01:00:15,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +24: [2023-05-13 01:00:15,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +24: [2023-05-13 01:00:15,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +24: [2023-05-13 01:00:15,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +23: [2023-05-13 01:00:15,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +20: [2023-05-13 01:00:15,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +15: [2023-05-13 01:00:15,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +31: [2023-05-13 01:00:15,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +15: [2023-05-13 01:00:15,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +31: [2023-05-13 01:00:15,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +31: [2023-05-13 01:00:15,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +15: [2023-05-13 01:00:15,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +31: [2023-05-13 01:00:15,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +22: [2023-05-13 01:00:15,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +22: [2023-05-13 01:00:15,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +22: [2023-05-13 01:00:15,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +31: [2023-05-13 01:00:15,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +22: [2023-05-13 01:00:15,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +30: [2023-05-13 01:00:15,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +22: [2023-05-13 01:00:15,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +22: [2023-05-13 01:00:15,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +20: [2023-05-13 01:00:15,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +20: [2023-05-13 01:00:15,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +20: [2023-05-13 01:00:15,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +31: [2023-05-13 01:00:15,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +12: [2023-05-13 01:00:15,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +12: [2023-05-13 01:00:15,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +12: [2023-05-13 01:00:15,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +12: [2023-05-13 01:00:15,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +12: [2023-05-13 01:00:15,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +31: [2023-05-13 01:00:15,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +20: [2023-05-13 01:00:15,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. +30: [2023-05-13 01:00:15,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +20: [2023-05-13 01:00:15,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +30: [2023-05-13 01:00:15,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +24: [2023-05-13 01:00:15,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +12: [2023-05-13 01:00:15,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +12: [2023-05-13 01:00:15,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +23: [2023-05-13 01:00:15,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +23: [2023-05-13 01:00:15,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +23: [2023-05-13 01:00:15,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +24: [2023-05-13 01:00:15,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +24: [2023-05-13 01:00:15,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +24: [2023-05-13 01:00:15,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +30: [2023-05-13 01:00:15,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +30: [2023-05-13 01:00:15,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +30: [2023-05-13 01:00:15,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +20: [2023-05-13 01:00:15,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +24: [2023-05-13 01:00:15,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +24: [2023-05-13 01:00:15,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +22: [2023-05-13 01:00:15,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +20: [2023-05-13 01:00:15,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_29-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +12: [2023-05-13 01:00:15,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +12: [2023-05-13 01:00:15,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +20: [2023-05-13 01:00:15,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +12: [2023-05-13 01:00:15,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +12: [2023-05-13 01:00:15,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +20: [2023-05-13 01:00:15,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +20: [2023-05-13 01:00:15,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +20: [2023-05-13 01:00:15,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +20: [2023-05-13 01:00:15,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +14: [2023-05-13 01:00:15,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +14: [2023-05-13 01:00:15,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +14: [2023-05-13 01:00:15,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +14: [2023-05-13 01:00:15,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +14: [2023-05-13 01:00:15,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +14: [2023-05-13 01:00:15,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +14: [2023-05-13 01:00:15,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +14: [2023-05-13 01:00:15,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +27: [2023-05-13 01:00:15,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +27: [2023-05-13 01:00:15,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +27: [2023-05-13 01:00:15,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +27: [2023-05-13 01:00:15,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +27: [2023-05-13 01:00:15,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +27: [2023-05-13 01:00:15,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +27: [2023-05-13 01:00:15,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +27: [2023-05-13 01:00:15,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +27: [2023-05-13 01:00:15,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +27: [2023-05-13 01:00:15,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +27: [2023-05-13 01:00:15,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +27: [2023-05-13 01:00:15,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +27: [2023-05-13 01:00:15,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +27: [2023-05-13 01:00:15,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +27: [2023-05-13 01:00:15,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +14: [2023-05-13 01:00:15,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +27: [2023-05-13 01:00:15,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +14: [2023-05-13 01:00:15,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +26: [2023-05-13 01:00:15,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +26: [2023-05-13 01:00:15,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +10: [2023-05-13 01:00:15,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +10: [2023-05-13 01:00:15,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +10: [2023-05-13 01:00:15,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +10: [2023-05-13 01:00:15,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +10: [2023-05-13 01:00:15,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +10: [2023-05-13 01:00:15,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +10: [2023-05-13 01:00:15,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +10: [2023-05-13 01:00:15,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +10: [2023-05-13 01:00:15,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +10: [2023-05-13 01:00:15,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +10: [2023-05-13 01:00:15,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +10: [2023-05-13 01:00:15,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +10: [2023-05-13 01:00:15,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +10: [2023-05-13 01:00:15,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +10: [2023-05-13 01:00:15,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +26: [2023-05-13 01:00:15,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +26: [2023-05-13 01:00:15,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +26: [2023-05-13 01:00:15,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +26: [2023-05-13 01:00:15,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +26: [2023-05-13 01:00:15,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +26: [2023-05-13 01:00:15,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +26: [2023-05-13 01:00:15,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +26: [2023-05-13 01:00:15,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +26: [2023-05-13 01:00:15,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +14: [2023-05-13 01:00:15,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +26: [2023-05-13 01:00:15,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +10: [2023-05-13 01:00:15,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +26: [2023-05-13 01:00:15,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +14: [2023-05-13 01:00:15,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +26: [2023-05-13 01:00:15,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +26: [2023-05-13 01:00:15,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +26: [2023-05-13 01:00:15,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +27: [2023-05-13 01:00:15,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +14: [2023-05-13 01:00:15,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +14: [2023-05-13 01:00:15,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +14: [2023-05-13 01:00:15,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +14: [2023-05-13 01:00:15,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +14: [2023-05-13 01:00:15,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +14: [2023-05-13 01:00:15,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +14: [2023-05-13 01:00:15,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +14: [2023-05-13 01:00:15,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +27: [2023-05-13 01:00:15,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +14: [2023-05-13 01:00:15,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +14: [2023-05-13 01:00:15,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +14: [2023-05-13 01:00:15,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +14: [2023-05-13 01:00:15,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +14: [2023-05-13 01:00:15,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +14: [2023-05-13 01:00:15,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +14: [2023-05-13 01:00:15,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +14: [2023-05-13 01:00:15,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +14: [2023-05-13 01:00:15,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +14: [2023-05-13 01:00:15,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +14: [2023-05-13 01:00:15,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +14: [2023-05-13 01:00:15,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +14: [2023-05-13 01:00:15,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +27: [2023-05-13 01:00:15,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +27: [2023-05-13 01:00:15,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +14: [2023-05-13 01:00:15,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +14: [2023-05-13 01:00:15,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +27: [2023-05-13 01:00:15,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +27: [2023-05-13 01:00:15,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +27: [2023-05-13 01:00:15,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +27: [2023-05-13 01:00:15,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +26: [2023-05-13 01:00:15,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +10: [2023-05-13 01:00:15,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +27: [2023-05-13 01:00:15,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +27: [2023-05-13 01:00:15,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +27: [2023-05-13 01:00:15,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +26: [2023-05-13 01:00:15,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +27: [2023-05-13 01:00:15,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +26: [2023-05-13 01:00:15,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +10: [2023-05-13 01:00:15,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +27: [2023-05-13 01:00:15,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +17: [2023-05-13 01:00:15,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +27: [2023-05-13 01:00:15,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +27: [2023-05-13 01:00:15,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +27: [2023-05-13 01:00:15,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +27: [2023-05-13 01:00:15,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +27: [2023-05-13 01:00:15,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +17: [2023-05-13 01:00:15,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +27: [2023-05-13 01:00:15,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +27: [2023-05-13 01:00:15,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +27: [2023-05-13 01:00:15,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +27: [2023-05-13 01:00:15,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +27: [2023-05-13 01:00:15,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +27: [2023-05-13 01:00:15,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +10: [2023-05-13 01:00:15,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +10: [2023-05-13 01:00:15,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +10: [2023-05-13 01:00:15,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +17: [2023-05-13 01:00:15,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +17: [2023-05-13 01:00:15,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +17: [2023-05-13 01:00:15,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +10: [2023-05-13 01:00:15,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +10: [2023-05-13 01:00:15,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +27: [2023-05-13 01:00:15,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +27: [2023-05-13 01:00:15,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +27: [2023-05-13 01:00:15,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +17: [2023-05-13 01:00:15,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +27: [2023-05-13 01:00:15,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +27: [2023-05-13 01:00:15,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +27: [2023-05-13 01:00:15,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +10: [2023-05-13 01:00:15,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +27: [2023-05-13 01:00:15,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +27: [2023-05-13 01:00:15,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +27: [2023-05-13 01:00:15,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +27: [2023-05-13 01:00:15,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +27: [2023-05-13 01:00:15,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +27: [2023-05-13 01:00:15,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +27: [2023-05-13 01:00:15,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +10: [2023-05-13 01:00:15,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +26: [2023-05-13 01:00:15,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +27: [2023-05-13 01:00:15,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +27: [2023-05-13 01:00:15,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +27: [2023-05-13 01:00:15,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +26: [2023-05-13 01:00:15,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +26: [2023-05-13 01:00:15,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +26: [2023-05-13 01:00:15,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +26: [2023-05-13 01:00:15,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +26: [2023-05-13 01:00:15,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +26: [2023-05-13 01:00:15,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +26: [2023-05-13 01:00:15,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +10: [2023-05-13 01:00:15,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +26: [2023-05-13 01:00:15,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +10: [2023-05-13 01:00:15,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +26: [2023-05-13 01:00:15,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +26: [2023-05-13 01:00:15,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +26: [2023-05-13 01:00:15,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +26: [2023-05-13 01:00:15,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +11: [2023-05-13 01:00:15,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +26: [2023-05-13 01:00:15,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +11: [2023-05-13 01:00:15,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +26: [2023-05-13 01:00:15,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +10: [2023-05-13 01:00:15,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +10: [2023-05-13 01:00:15,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +10: [2023-05-13 01:00:15,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +26: [2023-05-13 01:00:15,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +10: [2023-05-13 01:00:15,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +11: [2023-05-13 01:00:15,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +11: [2023-05-13 01:00:15,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +21: [2023-05-13 01:00:15,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +18: [2023-05-13 01:00:15,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +11: [2023-05-13 01:00:15,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +11: [2023-05-13 01:00:15,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +11: [2023-05-13 01:00:15,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +18: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +18: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +18: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +18: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +21: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +21: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +21: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +21: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +18: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +21: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +10: [2023-05-13 01:00:15,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +10: [2023-05-13 01:00:15,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +21: [2023-05-13 01:00:15,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +10: [2023-05-13 01:00:15,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +21: [2023-05-13 01:00:15,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +17: [2023-05-13 01:00:15,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +18: [2023-05-13 01:00:15,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +26: [2023-05-13 01:00:15,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +26: [2023-05-13 01:00:15,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +26: [2023-05-13 01:00:15,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +26: [2023-05-13 01:00:15,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +26: [2023-05-13 01:00:15,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +26: [2023-05-13 01:00:15,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +26: [2023-05-13 01:00:15,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +26: [2023-05-13 01:00:15,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +26: [2023-05-13 01:00:15,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +26: [2023-05-13 01:00:15,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +26: [2023-05-13 01:00:15,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +26: [2023-05-13 01:00:15,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +26: [2023-05-13 01:00:15,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +26: [2023-05-13 01:00:15,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +26: [2023-05-13 01:00:15,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +26: [2023-05-13 01:00:15,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +26: [2023-05-13 01:00:15,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +17: [2023-05-13 01:00:15,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +17: [2023-05-13 01:00:15,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +17: [2023-05-13 01:00:15,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +17: [2023-05-13 01:00:15,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +17: [2023-05-13 01:00:15,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +17: [2023-05-13 01:00:15,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +17: [2023-05-13 01:00:15,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +13: [2023-05-13 01:00:15,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +13: [2023-05-13 01:00:15,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +14: [2023-05-13 01:00:15,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt... +14: [2023-05-13 01:00:15,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt... +14: [2023-05-13 01:00:15,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt... +14: [2023-05-13 01:00:15,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt... + 4: [2023-05-13 01:00:15,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +14: [2023-05-13 01:00:15,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt... +14: [2023-05-13 01:00:15,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt... +14: [2023-05-13 01:00:15,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt... +14: [2023-05-13 01:00:15,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt... + 4: [2023-05-13 01:00:15,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +26: [2023-05-13 01:00:15,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +26: [2023-05-13 01:00:15,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +26: [2023-05-13 01:00:15,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +26: [2023-05-13 01:00:15,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +21: [2023-05-13 01:00:15,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +13: [2023-05-13 01:00:15,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +13: [2023-05-13 01:00:15,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +13: [2023-05-13 01:00:15,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +11: [2023-05-13 01:00:15,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +11: [2023-05-13 01:00:15,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +18: [2023-05-13 01:00:15,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +21: [2023-05-13 01:00:15,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +18: [2023-05-13 01:00:15,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +18: [2023-05-13 01:00:15,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +18: [2023-05-13 01:00:15,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +18: [2023-05-13 01:00:15,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +17: [2023-05-13 01:00:15,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +17: [2023-05-13 01:00:15,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +17: [2023-05-13 01:00:15,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +21: [2023-05-13 01:00:15,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +21: [2023-05-13 01:00:15,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +25: [2023-05-13 01:00:15,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +25: [2023-05-13 01:00:15,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +25: [2023-05-13 01:00:15,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +25: [2023-05-13 01:00:15,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +25: [2023-05-13 01:00:15,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +25: [2023-05-13 01:00:15,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +25: [2023-05-13 01:00:15,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +17: [2023-05-13 01:00:15,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +17: [2023-05-13 01:00:15,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +25: [2023-05-13 01:00:15,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +25: [2023-05-13 01:00:15,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +25: [2023-05-13 01:00:15,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +11: [2023-05-13 01:00:15,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +11: [2023-05-13 01:00:15,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +25: [2023-05-13 01:00:15,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +21: [2023-05-13 01:00:15,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +21: [2023-05-13 01:00:15,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +21: [2023-05-13 01:00:15,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +25: [2023-05-13 01:00:15,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +25: [2023-05-13 01:00:15,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +25: [2023-05-13 01:00:15,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +25: [2023-05-13 01:00:15,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +18: [2023-05-13 01:00:15,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +25: [2023-05-13 01:00:15,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +29: [2023-05-13 01:00:15,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +29: [2023-05-13 01:00:15,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +11: [2023-05-13 01:00:15,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +18: [2023-05-13 01:00:15,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 7: [2023-05-13 01:00:15,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt... + 7: [2023-05-13 01:00:15,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt... + 7: [2023-05-13 01:00:15,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt... + 7: [2023-05-13 01:00:15,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt... +18: [2023-05-13 01:00:15,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +18: [2023-05-13 01:00:15,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 7: [2023-05-13 01:00:15,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt... + 7: [2023-05-13 01:00:15,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt... + 7: [2023-05-13 01:00:15,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt... + 7: [2023-05-13 01:00:15,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt... + 6: [2023-05-13 01:00:15,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +18: [2023-05-13 01:00:15,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 6: [2023-05-13 01:00:15,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +17: [2023-05-13 01:00:15,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +21: [2023-05-13 01:00:15,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +18: [2023-05-13 01:00:15,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +21: [2023-05-13 01:00:15,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +21: [2023-05-13 01:00:15,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +18: [2023-05-13 01:00:15,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +11: [2023-05-13 01:00:15,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +11: [2023-05-13 01:00:15,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +29: [2023-05-13 01:00:15,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +21: [2023-05-13 01:00:15,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +11: [2023-05-13 01:00:15,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +21: [2023-05-13 01:00:15,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +21: [2023-05-13 01:00:15,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +29: [2023-05-13 01:00:15,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +11: [2023-05-13 01:00:15,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +29: [2023-05-13 01:00:15,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +29: [2023-05-13 01:00:15,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +29: [2023-05-13 01:00:15,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +21: [2023-05-13 01:00:15,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +29: [2023-05-13 01:00:15,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +29: [2023-05-13 01:00:15,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +11: [2023-05-13 01:00:15,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +28: [2023-05-13 01:00:15,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +28: [2023-05-13 01:00:15,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +28: [2023-05-13 01:00:15,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +18: [2023-05-13 01:00:15,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +28: [2023-05-13 01:00:15,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +28: [2023-05-13 01:00:15,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +18: [2023-05-13 01:00:15,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +18: [2023-05-13 01:00:15,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +18: [2023-05-13 01:00:15,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +18: [2023-05-13 01:00:15,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +18: [2023-05-13 01:00:15,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +18: [2023-05-13 01:00:15,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +28: [2023-05-13 01:00:15,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +18: [2023-05-13 01:00:15,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +18: [2023-05-13 01:00:15,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +11: [2023-05-13 01:00:15,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +18: [2023-05-13 01:00:15,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +18: [2023-05-13 01:00:15,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +11: [2023-05-13 01:00:15,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +11: [2023-05-13 01:00:15,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +18: [2023-05-13 01:00:15,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +29: [2023-05-13 01:00:15,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +11: [2023-05-13 01:00:15,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +11: [2023-05-13 01:00:15,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +28: [2023-05-13 01:00:15,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +11: [2023-05-13 01:00:15,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +11: [2023-05-13 01:00:15,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +29: [2023-05-13 01:00:15,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +11: [2023-05-13 01:00:15,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +29: [2023-05-13 01:00:15,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +17: [2023-05-13 01:00:15,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +13: [2023-05-13 01:00:15,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +21: [2023-05-13 01:00:15,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +21: [2023-05-13 01:00:15,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +21: [2023-05-13 01:00:15,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +17: [2023-05-13 01:00:15,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +29: [2023-05-13 01:00:15,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +17: [2023-05-13 01:00:15,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +28: [2023-05-13 01:00:15,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +29: [2023-05-13 01:00:15,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +29: [2023-05-13 01:00:15,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +17: [2023-05-13 01:00:15,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +28: [2023-05-13 01:00:15,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +17: [2023-05-13 01:00:15,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +29: [2023-05-13 01:00:15,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +17: [2023-05-13 01:00:15,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +17: [2023-05-13 01:00:15,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +17: [2023-05-13 01:00:15,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +28: [2023-05-13 01:00:15,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +17: [2023-05-13 01:00:15,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +17: [2023-05-13 01:00:15,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +17: [2023-05-13 01:00:15,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +17: [2023-05-13 01:00:15,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +11: [2023-05-13 01:00:15,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +11: [2023-05-13 01:00:15,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +11: [2023-05-13 01:00:15,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +11: [2023-05-13 01:00:15,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +27: [2023-05-13 01:00:15,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt... +27: [2023-05-13 01:00:15,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt... +27: [2023-05-13 01:00:15,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt... +27: [2023-05-13 01:00:15,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt... +27: [2023-05-13 01:00:15,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt... +27: [2023-05-13 01:00:15,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt... +27: [2023-05-13 01:00:15,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt... +27: [2023-05-13 01:00:15,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt... +21: [2023-05-13 01:00:15,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +21: [2023-05-13 01:00:15,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +21: [2023-05-13 01:00:15,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +21: [2023-05-13 01:00:15,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +21: [2023-05-13 01:00:15,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +21: [2023-05-13 01:00:15,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +21: [2023-05-13 01:00:15,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +11: [2023-05-13 01:00:15,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +21: [2023-05-13 01:00:15,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +11: [2023-05-13 01:00:15,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +11: [2023-05-13 01:00:15,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +11: [2023-05-13 01:00:15,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +11: [2023-05-13 01:00:15,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +11: [2023-05-13 01:00:15,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +11: [2023-05-13 01:00:15,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +13: [2023-05-13 01:00:15,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +18: [2023-05-13 01:00:15,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +18: [2023-05-13 01:00:15,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +18: [2023-05-13 01:00:15,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +18: [2023-05-13 01:00:15,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +18: [2023-05-13 01:00:15,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +18: [2023-05-13 01:00:15,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +18: [2023-05-13 01:00:15,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +18: [2023-05-13 01:00:15,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +21: [2023-05-13 01:00:15,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +21: [2023-05-13 01:00:15,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +21: [2023-05-13 01:00:15,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +21: [2023-05-13 01:00:15,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +21: [2023-05-13 01:00:15,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +21: [2023-05-13 01:00:15,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +17: [2023-05-13 01:00:15,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +21: [2023-05-13 01:00:15,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +21: [2023-05-13 01:00:15,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +21: [2023-05-13 01:00:15,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +17: [2023-05-13 01:00:15,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +19: [2023-05-13 01:00:15,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +17: [2023-05-13 01:00:15,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +21: [2023-05-13 01:00:15,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +21: [2023-05-13 01:00:15,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +17: [2023-05-13 01:00:15,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +21: [2023-05-13 01:00:15,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +19: [2023-05-13 01:00:15,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +19: [2023-05-13 01:00:15,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +19: [2023-05-13 01:00:15,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +19: [2023-05-13 01:00:15,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +19: [2023-05-13 01:00:15,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +19: [2023-05-13 01:00:15,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +19: [2023-05-13 01:00:15,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +18: [2023-05-13 01:00:15,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +18: [2023-05-13 01:00:15,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +18: [2023-05-13 01:00:15,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +19: [2023-05-13 01:00:15,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +13: [2023-05-13 01:00:15,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +19: [2023-05-13 01:00:15,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +13: [2023-05-13 01:00:15,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +19: [2023-05-13 01:00:15,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +19: [2023-05-13 01:00:15,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +13: [2023-05-13 01:00:15,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +29: [2023-05-13 01:00:15,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +19: [2023-05-13 01:00:15,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +10: [2023-05-13 01:00:15,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt... +10: [2023-05-13 01:00:15,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt... +10: [2023-05-13 01:00:15,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt... +10: [2023-05-13 01:00:15,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt... +10: [2023-05-13 01:00:15,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt... +10: [2023-05-13 01:00:15,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt... +10: [2023-05-13 01:00:15,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt... +10: [2023-05-13 01:00:15,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt... +25: [2023-05-13 01:00:15,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +25: [2023-05-13 01:00:15,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +19: [2023-05-13 01:00:15,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +13: [2023-05-13 01:00:15,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +13: [2023-05-13 01:00:15,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +13: [2023-05-13 01:00:15,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +13: [2023-05-13 01:00:15,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +13: [2023-05-13 01:00:15,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +13: [2023-05-13 01:00:15,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +19: [2023-05-13 01:00:15,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +19: [2023-05-13 01:00:15,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +16: [2023-05-13 01:00:15,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +16: [2023-05-13 01:00:15,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +16: [2023-05-13 01:00:15,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +26: [2023-05-13 01:00:15,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt... +26: [2023-05-13 01:00:15,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt... +26: [2023-05-13 01:00:15,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt... +16: [2023-05-13 01:00:15,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +26: [2023-05-13 01:00:15,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt... +16: [2023-05-13 01:00:15,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +16: [2023-05-13 01:00:15,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +16: [2023-05-13 01:00:15,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +26: [2023-05-13 01:00:15,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt... +26: [2023-05-13 01:00:15,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt... +26: [2023-05-13 01:00:15,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt... +26: [2023-05-13 01:00:15,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt... +16: [2023-05-13 01:00:15,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +16: [2023-05-13 01:00:15,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +13: [2023-05-13 01:00:15,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +13: [2023-05-13 01:00:15,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +13: [2023-05-13 01:00:15,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +16: [2023-05-13 01:00:15,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +16: [2023-05-13 01:00:15,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +16: [2023-05-13 01:00:15,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +25: [2023-05-13 01:00:15,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +13: [2023-05-13 01:00:15,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +23: [2023-05-13 01:00:15,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +23: [2023-05-13 01:00:15,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +16: [2023-05-13 01:00:15,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +16: [2023-05-13 01:00:15,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +16: [2023-05-13 01:00:15,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +25: [2023-05-13 01:00:15,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +16: [2023-05-13 01:00:15,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +25: [2023-05-13 01:00:15,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +29: [2023-05-13 01:00:15,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +28: [2023-05-13 01:00:15,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +13: [2023-05-13 01:00:15,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +13: [2023-05-13 01:00:15,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +25: [2023-05-13 01:00:15,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +13: [2023-05-13 01:00:15,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +23: [2023-05-13 01:00:15,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +13: [2023-05-13 01:00:15,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +13: [2023-05-13 01:00:15,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +13: [2023-05-13 01:00:15,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +25: [2023-05-13 01:00:15,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +25: [2023-05-13 01:00:15,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +25: [2023-05-13 01:00:15,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +25: [2023-05-13 01:00:15,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +25: [2023-05-13 01:00:15,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +25: [2023-05-13 01:00:15,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +29: [2023-05-13 01:00:15,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +13: [2023-05-13 01:00:15,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +13: [2023-05-13 01:00:15,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +13: [2023-05-13 01:00:15,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +23: [2023-05-13 01:00:15,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +23: [2023-05-13 01:00:15,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +13: [2023-05-13 01:00:15,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +13: [2023-05-13 01:00:15,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +13: [2023-05-13 01:00:15,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +22: [2023-05-13 01:00:15,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +22: [2023-05-13 01:00:15,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +23: [2023-05-13 01:00:15,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +23: [2023-05-13 01:00:15,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +23: [2023-05-13 01:00:15,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +23: [2023-05-13 01:00:15,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +23: [2023-05-13 01:00:15,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +15: [2023-05-13 01:00:15,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +15: [2023-05-13 01:00:15,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +15: [2023-05-13 01:00:15,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +15: [2023-05-13 01:00:15,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +15: [2023-05-13 01:00:15,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +15: [2023-05-13 01:00:15,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +22: [2023-05-13 01:00:15,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +22: [2023-05-13 01:00:15,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +22: [2023-05-13 01:00:15,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +22: [2023-05-13 01:00:15,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +22: [2023-05-13 01:00:15,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +15: [2023-05-13 01:00:15,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +22: [2023-05-13 01:00:15,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +29: [2023-05-13 01:00:15,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +29: [2023-05-13 01:00:15,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +30: [2023-05-13 01:00:15,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +29: [2023-05-13 01:00:15,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +29: [2023-05-13 01:00:15,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +30: [2023-05-13 01:00:15,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +22: [2023-05-13 01:00:15,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +23: [2023-05-13 01:00:15,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +22: [2023-05-13 01:00:15,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +22: [2023-05-13 01:00:15,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +22: [2023-05-13 01:00:15,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +23: [2023-05-13 01:00:15,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +15: [2023-05-13 01:00:15,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +15: [2023-05-13 01:00:15,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +15: [2023-05-13 01:00:15,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +15: [2023-05-13 01:00:15,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +22: [2023-05-13 01:00:15,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +15: [2023-05-13 01:00:15,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +30: [2023-05-13 01:00:15,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +22: [2023-05-13 01:00:15,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +15: [2023-05-13 01:00:15,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +30: [2023-05-13 01:00:15,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +30: [2023-05-13 01:00:15,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +30: [2023-05-13 01:00:15,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +30: [2023-05-13 01:00:15,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +30: [2023-05-13 01:00:15,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +30: [2023-05-13 01:00:15,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +30: [2023-05-13 01:00:15,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +23: [2023-05-13 01:00:15,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +22: [2023-05-13 01:00:15,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +22: [2023-05-13 01:00:15,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +15: [2023-05-13 01:00:15,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +23: [2023-05-13 01:00:15,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +28: [2023-05-13 01:00:15,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +28: [2023-05-13 01:00:15,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +28: [2023-05-13 01:00:15,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +15: [2023-05-13 01:00:15,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +23: [2023-05-13 01:00:15,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +23: [2023-05-13 01:00:15,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +13: [2023-05-13 01:00:15,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +13: [2023-05-13 01:00:15,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +30: [2023-05-13 01:00:15,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +28: [2023-05-13 01:00:15,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +28: [2023-05-13 01:00:15,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +13: [2023-05-13 01:00:15,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +29: [2023-05-13 01:00:15,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +19: [2023-05-13 01:00:15,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +25: [2023-05-13 01:00:15,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +29: [2023-05-13 01:00:15,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +25: [2023-05-13 01:00:15,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +25: [2023-05-13 01:00:15,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +25: [2023-05-13 01:00:15,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +25: [2023-05-13 01:00:15,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +29: [2023-05-13 01:00:15,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +30: [2023-05-13 01:00:15,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +25: [2023-05-13 01:00:15,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +25: [2023-05-13 01:00:15,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +23: [2023-05-13 01:00:15,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +30: [2023-05-13 01:00:15,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +30: [2023-05-13 01:00:15,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +28: [2023-05-13 01:00:15,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +25: [2023-05-13 01:00:15,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +30: [2023-05-13 01:00:15,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +25: [2023-05-13 01:00:15,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +25: [2023-05-13 01:00:15,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +25: [2023-05-13 01:00:15,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +30: [2023-05-13 01:00:15,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +25: [2023-05-13 01:00:15,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +29: [2023-05-13 01:00:15,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +28: [2023-05-13 01:00:15,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +29: [2023-05-13 01:00:15,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +29: [2023-05-13 01:00:15,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +29: [2023-05-13 01:00:15,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +31: [2023-05-13 01:00:15,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +31: [2023-05-13 01:00:15,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +31: [2023-05-13 01:00:15,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +31: [2023-05-13 01:00:15,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +31: [2023-05-13 01:00:15,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +29: [2023-05-13 01:00:15,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +16: [2023-05-13 01:00:15,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +28: [2023-05-13 01:00:15,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +31: [2023-05-13 01:00:15,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +31: [2023-05-13 01:00:15,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +28: [2023-05-13 01:00:15,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +28: [2023-05-13 01:00:15,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +31: [2023-05-13 01:00:15,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +31: [2023-05-13 01:00:15,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +31: [2023-05-13 01:00:15,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +31: [2023-05-13 01:00:15,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +29: [2023-05-13 01:00:15,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +19: [2023-05-13 01:00:15,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +29: [2023-05-13 01:00:15,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +29: [2023-05-13 01:00:15,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +29: [2023-05-13 01:00:15,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 3: [2023-05-13 01:00:15,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +28: [2023-05-13 01:00:15,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +29: [2023-05-13 01:00:15,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +25: [2023-05-13 01:00:15,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +28: [2023-05-13 01:00:15,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +25: [2023-05-13 01:00:15,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +25: [2023-05-13 01:00:15,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +28: [2023-05-13 01:00:15,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +25: [2023-05-13 01:00:15,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +28: [2023-05-13 01:00:15,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +28: [2023-05-13 01:00:15,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +25: [2023-05-13 01:00:15,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +25: [2023-05-13 01:00:15,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +28: [2023-05-13 01:00:15,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +19: [2023-05-13 01:00:15,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +28: [2023-05-13 01:00:15,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +25: [2023-05-13 01:00:15,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +25: [2023-05-13 01:00:15,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +25: [2023-05-13 01:00:15,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +25: [2023-05-13 01:00:15,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +28: [2023-05-13 01:00:15,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +25: [2023-05-13 01:00:15,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +25: [2023-05-13 01:00:15,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +23: [2023-05-13 01:00:15,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 0: > overriding learning rate value to 0.0002 + 0: > overriding minimum learning rate value to 2e-05 + 0: > overriding warmup iterations value to 0 + 0: > overriding total number of iterations value to 1 + 0: > overriding decay style value to cosine +28: [2023-05-13 01:00:15,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +28: [2023-05-13 01:00:15,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +28: [2023-05-13 01:00:15,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +29: [2023-05-13 01:00:15,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +28: [2023-05-13 01:00:15,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +17: [2023-05-13 01:00:15,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt... +17: [2023-05-13 01:00:15,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt... +17: [2023-05-13 01:00:15,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt... +17: [2023-05-13 01:00:15,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt... +17: [2023-05-13 01:00:15,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt... +17: [2023-05-13 01:00:15,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt... +17: [2023-05-13 01:00:15,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt... +17: [2023-05-13 01:00:15,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt... +29: [2023-05-13 01:00:15,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +29: [2023-05-13 01:00:15,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +29: [2023-05-13 01:00:15,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +19: [2023-05-13 01:00:15,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +19: [2023-05-13 01:00:15,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +19: [2023-05-13 01:00:15,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +19: [2023-05-13 01:00:15,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +23: [2023-05-13 01:00:15,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +19: [2023-05-13 01:00:15,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +23: [2023-05-13 01:00:15,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +30: [2023-05-13 01:00:15,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +23: [2023-05-13 01:00:15,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +29: [2023-05-13 01:00:15,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +29: [2023-05-13 01:00:15,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +29: [2023-05-13 01:00:15,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +29: [2023-05-13 01:00:15,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +29: [2023-05-13 01:00:15,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +29: [2023-05-13 01:00:15,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +29: [2023-05-13 01:00:15,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +29: [2023-05-13 01:00:15,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +16: [2023-05-13 01:00:15,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +25: [2023-05-13 01:00:15,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +16: [2023-05-13 01:00:15,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +25: [2023-05-13 01:00:15,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +16: [2023-05-13 01:00:15,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +25: [2023-05-13 01:00:15,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +25: [2023-05-13 01:00:15,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 6: [2023-05-13 01:00:15,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt... + 6: [2023-05-13 01:00:15,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt... + 6: [2023-05-13 01:00:15,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt... + 6: [2023-05-13 01:00:15,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt... + 6: [2023-05-13 01:00:15,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt... + 6: [2023-05-13 01:00:15,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt... + 6: [2023-05-13 01:00:15,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt... + 6: [2023-05-13 01:00:15,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt... +24: [2023-05-13 01:00:15,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +24: [2023-05-13 01:00:15,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +16: [2023-05-13 01:00:15,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +16: [2023-05-13 01:00:15,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +24: [2023-05-13 01:00:15,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +20: [2023-05-13 01:00:15,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +20: [2023-05-13 01:00:15,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +29: [2023-05-13 01:00:15,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +24: [2023-05-13 01:00:15,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +16: [2023-05-13 01:00:15,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +24: [2023-05-13 01:00:15,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +24: [2023-05-13 01:00:15,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +29: [2023-05-13 01:00:15,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +29: [2023-05-13 01:00:15,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +24: [2023-05-13 01:00:15,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +29: [2023-05-13 01:00:15,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +24: [2023-05-13 01:00:15,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +24: [2023-05-13 01:00:15,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +20: [2023-05-13 01:00:15,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +20: [2023-05-13 01:00:15,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +20: [2023-05-13 01:00:15,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +20: [2023-05-13 01:00:15,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +20: [2023-05-13 01:00:15,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +20: [2023-05-13 01:00:15,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +20: [2023-05-13 01:00:15,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +20: [2023-05-13 01:00:15,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +12: [2023-05-13 01:00:15,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +12: [2023-05-13 01:00:15,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +12: [2023-05-13 01:00:15,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +19: [2023-05-13 01:00:15,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +12: [2023-05-13 01:00:15,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +12: [2023-05-13 01:00:15,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +12: [2023-05-13 01:00:15,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +12: [2023-05-13 01:00:15,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +24: [2023-05-13 01:00:15,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +12: [2023-05-13 01:00:15,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +24: [2023-05-13 01:00:15,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +19: [2023-05-13 01:00:15,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +19: [2023-05-13 01:00:15,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +19: [2023-05-13 01:00:15,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +23: [2023-05-13 01:00:15,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +19: [2023-05-13 01:00:15,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +19: [2023-05-13 01:00:15,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +12: [2023-05-13 01:00:15,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +18: [2023-05-13 01:00:15,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt... +18: [2023-05-13 01:00:15,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt... +18: [2023-05-13 01:00:15,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt... +18: [2023-05-13 01:00:15,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt... +18: [2023-05-13 01:00:15,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt... +18: [2023-05-13 01:00:15,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt... +18: [2023-05-13 01:00:15,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt... +18: [2023-05-13 01:00:15,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt... +20: [2023-05-13 01:00:15,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +30: [2023-05-13 01:00:15,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +20: [2023-05-13 01:00:15,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +24: [2023-05-13 01:00:15,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +29: [2023-05-13 01:00:15,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +22: [2023-05-13 01:00:15,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +22: [2023-05-13 01:00:15,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +22: [2023-05-13 01:00:15,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +29: [2023-05-13 01:00:15,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +29: [2023-05-13 01:00:15,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +24: [2023-05-13 01:00:15,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +29: [2023-05-13 01:00:15,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +24: [2023-05-13 01:00:15,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +22: [2023-05-13 01:00:15,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +22: [2023-05-13 01:00:15,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +24: [2023-05-13 01:00:15,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +12: [2023-05-13 01:00:15,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +12: [2023-05-13 01:00:15,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +11: [2023-05-13 01:00:15,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt... +11: [2023-05-13 01:00:15,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt... +11: [2023-05-13 01:00:15,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt... +15: [2023-05-13 01:00:15,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +15: [2023-05-13 01:00:15,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +15: [2023-05-13 01:00:15,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +11: [2023-05-13 01:00:15,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt... +11: [2023-05-13 01:00:15,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt... +11: [2023-05-13 01:00:15,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt... +11: [2023-05-13 01:00:15,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt... +11: [2023-05-13 01:00:15,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt... +20: [2023-05-13 01:00:15,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +12: [2023-05-13 01:00:15,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +20: [2023-05-13 01:00:15,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +12: [2023-05-13 01:00:15,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +12: [2023-05-13 01:00:15,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +12: [2023-05-13 01:00:15,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +20: [2023-05-13 01:00:15,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +30: [2023-05-13 01:00:15,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +12: [2023-05-13 01:00:15,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +20: [2023-05-13 01:00:15,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +21: [2023-05-13 01:00:15,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt... +21: [2023-05-13 01:00:15,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt... +21: [2023-05-13 01:00:15,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt... +21: [2023-05-13 01:00:15,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt... +21: [2023-05-13 01:00:15,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt... +21: [2023-05-13 01:00:15,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt... +21: [2023-05-13 01:00:15,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt... +21: [2023-05-13 01:00:15,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt... +30: [2023-05-13 01:00:15,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +30: [2023-05-13 01:00:15,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +30: [2023-05-13 01:00:15,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +30: [2023-05-13 01:00:15,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +15: [2023-05-13 01:00:15,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +15: [2023-05-13 01:00:15,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +15: [2023-05-13 01:00:15,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +23: [2023-05-13 01:00:15,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +15: [2023-05-13 01:00:15,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +16: [2023-05-13 01:00:15,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +23: [2023-05-13 01:00:15,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +16: [2023-05-13 01:00:15,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +16: [2023-05-13 01:00:15,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +22: [2023-05-13 01:00:15,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +16: [2023-05-13 01:00:15,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +31: [2023-05-13 01:00:15,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +16: [2023-05-13 01:00:15,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +16: [2023-05-13 01:00:15,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +19: [2023-05-13 01:00:15,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +19: [2023-05-13 01:00:15,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +16: [2023-05-13 01:00:15,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +16: [2023-05-13 01:00:15,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +19: [2023-05-13 01:00:15,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +19: [2023-05-13 01:00:15,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +19: [2023-05-13 01:00:15,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +19: [2023-05-13 01:00:15,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +16: [2023-05-13 01:00:15,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +19: [2023-05-13 01:00:15,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +19: [2023-05-13 01:00:15,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +23: [2023-05-13 01:00:15,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +16: [2023-05-13 01:00:15,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +16: [2023-05-13 01:00:15,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +23: [2023-05-13 01:00:15,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +23: [2023-05-13 01:00:15,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +16: [2023-05-13 01:00:15,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +23: [2023-05-13 01:00:15,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +22: [2023-05-13 01:00:15,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +22: [2023-05-13 01:00:15,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +30: [2023-05-13 01:00:15,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +19: [2023-05-13 01:00:15,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +19: [2023-05-13 01:00:15,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +30: [2023-05-13 01:00:15,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +30: [2023-05-13 01:00:15,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +30: [2023-05-13 01:00:15,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +22: [2023-05-13 01:00:15,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +19: [2023-05-13 01:00:15,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +19: [2023-05-13 01:00:15,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +19: [2023-05-13 01:00:15,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +22: [2023-05-13 01:00:15,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 0: [2023-05-13 01:00:15,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +19: [2023-05-13 01:00:15,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +22: [2023-05-13 01:00:15,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +31: [2023-05-13 01:00:15,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +31: [2023-05-13 01:00:15,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +22: [2023-05-13 01:00:15,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +31: [2023-05-13 01:00:15,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +15: [2023-05-13 01:00:15,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +31: [2023-05-13 01:00:15,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +16: [2023-05-13 01:00:15,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +15: [2023-05-13 01:00:15,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +24: [2023-05-13 01:00:15,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +22: [2023-05-13 01:00:15,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +19: [2023-05-13 01:00:15,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +19: [2023-05-13 01:00:15,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +19: [2023-05-13 01:00:15,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +15: [2023-05-13 01:00:15,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +22: [2023-05-13 01:00:15,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +22: [2023-05-13 01:00:15,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +22: [2023-05-13 01:00:15,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +22: [2023-05-13 01:00:15,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +22: [2023-05-13 01:00:15,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +22: [2023-05-13 01:00:15,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +22: [2023-05-13 01:00:15,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +22: [2023-05-13 01:00:15,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +19: [2023-05-13 01:00:15,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +30: [2023-05-13 01:00:15,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +30: [2023-05-13 01:00:15,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +30: [2023-05-13 01:00:15,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +30: [2023-05-13 01:00:15,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +23: [2023-05-13 01:00:15,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +23: [2023-05-13 01:00:15,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +23: [2023-05-13 01:00:15,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +30: [2023-05-13 01:00:15,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +30: [2023-05-13 01:00:15,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +22: [2023-05-13 01:00:15,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +22: [2023-05-13 01:00:15,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +30: [2023-05-13 01:00:15,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +30: [2023-05-13 01:00:15,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +22: [2023-05-13 01:00:15,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +22: [2023-05-13 01:00:15,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +22: [2023-05-13 01:00:15,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +22: [2023-05-13 01:00:15,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +22: [2023-05-13 01:00:15,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +31: [2023-05-13 01:00:15,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +31: [2023-05-13 01:00:15,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +23: [2023-05-13 01:00:15,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt... +23: [2023-05-13 01:00:15,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +23: [2023-05-13 01:00:15,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +23: [2023-05-13 01:00:15,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +22: [2023-05-13 01:00:15,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +22: [2023-05-13 01:00:15,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +22: [2023-05-13 01:00:15,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +22: [2023-05-13 01:00:15,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +12: [2023-05-13 01:00:15,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +23: [2023-05-13 01:00:15,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +16: [2023-05-13 01:00:15,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +20: [2023-05-13 01:00:15,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +15: [2023-05-13 01:00:15,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +16: [2023-05-13 01:00:15,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +16: [2023-05-13 01:00:15,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +23: [2023-05-13 01:00:15,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +23: [2023-05-13 01:00:15,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +15: [2023-05-13 01:00:15,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +16: [2023-05-13 01:00:15,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +16: [2023-05-13 01:00:15,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +23: [2023-05-13 01:00:15,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +16: [2023-05-13 01:00:15,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +16: [2023-05-13 01:00:15,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +16: [2023-05-13 01:00:15,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +24: [2023-05-13 01:00:15,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +16: [2023-05-13 01:00:15,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +30: [2023-05-13 01:00:15,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +16: [2023-05-13 01:00:15,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +16: [2023-05-13 01:00:15,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +16: [2023-05-13 01:00:15,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +19: [2023-05-13 01:00:15,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +22: [2023-05-13 01:00:15,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +19: [2023-05-13 01:00:15,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +19: [2023-05-13 01:00:15,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +22: [2023-05-13 01:00:15,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +22: [2023-05-13 01:00:15,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +19: [2023-05-13 01:00:15,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +23: [2023-05-13 01:00:15,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +13: [2023-05-13 01:00:15,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt... +13: [2023-05-13 01:00:15,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt... +13: [2023-05-13 01:00:15,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt... +13: [2023-05-13 01:00:15,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt... +13: [2023-05-13 01:00:15,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt... +13: [2023-05-13 01:00:15,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt... +22: [2023-05-13 01:00:15,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +13: [2023-05-13 01:00:15,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt... +13: [2023-05-13 01:00:15,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt... + 9: [2023-05-13 01:00:15,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 9: [2023-05-13 01:00:15,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +25: [2023-05-13 01:00:15,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt... +25: [2023-05-13 01:00:15,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt... +25: [2023-05-13 01:00:15,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt... +25: [2023-05-13 01:00:15,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt... +25: [2023-05-13 01:00:15,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt... +25: [2023-05-13 01:00:15,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt... +25: [2023-05-13 01:00:15,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt... +25: [2023-05-13 01:00:15,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt... + 9: [2023-05-13 01:00:15,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +22: [2023-05-13 01:00:15,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +16: [2023-05-13 01:00:15,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +22: [2023-05-13 01:00:15,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 4: [2023-05-13 01:00:15,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt... + 4: [2023-05-13 01:00:15,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt... +22: [2023-05-13 01:00:15,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt... + 4: [2023-05-13 01:00:15,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt... + 4: [2023-05-13 01:00:15,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt... + 4: [2023-05-13 01:00:15,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt... + 4: [2023-05-13 01:00:15,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt... +19: [2023-05-13 01:00:15,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 4: [2023-05-13 01:00:15,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt... +16: [2023-05-13 01:00:15,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +16: [2023-05-13 01:00:15,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +22: [2023-05-13 01:00:15,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +19: [2023-05-13 01:00:15,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +16: [2023-05-13 01:00:15,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +19: [2023-05-13 01:00:15,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +19: [2023-05-13 01:00:15,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt... + 3: [2023-05-13 01:00:15,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt... + 3: [2023-05-13 01:00:15,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt... + 3: [2023-05-13 01:00:15,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt... + 3: [2023-05-13 01:00:15,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt... + 3: [2023-05-13 01:00:15,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt... + 3: [2023-05-13 01:00:15,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt... +16: [2023-05-13 01:00:15,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 3: [2023-05-13 01:00:15,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt... +16: [2023-05-13 01:00:15,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +16: [2023-05-13 01:00:15,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +16: [2023-05-13 01:00:15,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +23: [2023-05-13 01:00:15,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +23: [2023-05-13 01:00:15,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +23: [2023-05-13 01:00:15,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +30: [2023-05-13 01:00:15,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +23: [2023-05-13 01:00:15,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +31: [2023-05-13 01:00:15,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +30: [2023-05-13 01:00:15,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +30: [2023-05-13 01:00:15,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +30: [2023-05-13 01:00:15,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +31: [2023-05-13 01:00:15,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +23: [2023-05-13 01:00:15,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +24: [2023-05-13 01:00:15,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +30: [2023-05-13 01:00:15,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +23: [2023-05-13 01:00:15,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +23: [2023-05-13 01:00:15,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +12: [2023-05-13 01:00:15,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +23: [2023-05-13 01:00:15,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +30: [2023-05-13 01:00:15,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +30: [2023-05-13 01:00:15,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +30: [2023-05-13 01:00:15,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +23: [2023-05-13 01:00:15,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +30: [2023-05-13 01:00:15,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +23: [2023-05-13 01:00:15,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +23: [2023-05-13 01:00:15,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +30: [2023-05-13 01:00:15,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +30: [2023-05-13 01:00:15,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +20: [2023-05-13 01:00:15,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +30: [2023-05-13 01:00:15,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +23: [2023-05-13 01:00:15,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +30: [2023-05-13 01:00:15,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +30: [2023-05-13 01:00:15,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +30: [2023-05-13 01:00:15,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +20: [2023-05-13 01:00:15,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +30: [2023-05-13 01:00:15,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +12: [2023-05-13 01:00:15,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +12: [2023-05-13 01:00:15,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +24: [2023-05-13 01:00:15,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +20: [2023-05-13 01:00:15,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +20: [2023-05-13 01:00:15,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 5: [2023-05-13 01:00:15,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +23: [2023-05-13 01:00:15,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 5: [2023-05-13 01:00:15,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +30: [2023-05-13 01:00:15,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +23: [2023-05-13 01:00:15,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +23: [2023-05-13 01:00:15,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +30: [2023-05-13 01:00:15,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +23: [2023-05-13 01:00:15,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +30: [2023-05-13 01:00:15,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +30: [2023-05-13 01:00:15,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 0: [2023-05-13 01:00:15,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt... + 0: [2023-05-13 01:00:15,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt... + 0: [2023-05-13 01:00:15,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt... + 0: [2023-05-13 01:00:15,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt... + 0: [2023-05-13 01:00:15,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt... + 0: [2023-05-13 01:00:15,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt... + 0: [2023-05-13 01:00:15,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt... + 0: [2023-05-13 01:00:15,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt... +29: [2023-05-13 01:00:15,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt... +29: [2023-05-13 01:00:15,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt... +29: [2023-05-13 01:00:15,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt... +29: [2023-05-13 01:00:15,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt... +29: [2023-05-13 01:00:15,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt... +29: [2023-05-13 01:00:15,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt... +29: [2023-05-13 01:00:15,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt... +29: [2023-05-13 01:00:15,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt... + 1: [2023-05-13 01:00:15,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +28: [2023-05-13 01:00:15,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt... +28: [2023-05-13 01:00:15,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt... +28: [2023-05-13 01:00:15,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt... +28: [2023-05-13 01:00:15,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt... +28: [2023-05-13 01:00:15,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt... +28: [2023-05-13 01:00:15,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt... +28: [2023-05-13 01:00:15,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt... +28: [2023-05-13 01:00:15,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt... + 2: [2023-05-13 01:00:15,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +24: [2023-05-13 01:00:15,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +24: [2023-05-13 01:00:15,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +31: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +31: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +12: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +12: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +31: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +31: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +31: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +31: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +20: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +20: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +31: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +12: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +15: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +15: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +15: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +15: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +15: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +15: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +20: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +31: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +31: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +31: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +31: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +31: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +31: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +31: [2023-05-13 01:00:15,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +24: [2023-05-13 01:00:15,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +15: [2023-05-13 01:00:15,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +15: [2023-05-13 01:00:15,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +15: [2023-05-13 01:00:15,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +24: [2023-05-13 01:00:15,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +24: [2023-05-13 01:00:15,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +24: [2023-05-13 01:00:15,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +12: [2023-05-13 01:00:15,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +12: [2023-05-13 01:00:15,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +12: [2023-05-13 01:00:15,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +12: [2023-05-13 01:00:15,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +20: [2023-05-13 01:00:15,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +20: [2023-05-13 01:00:15,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +24: [2023-05-13 01:00:15,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +12: [2023-05-13 01:00:15,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +12: [2023-05-13 01:00:15,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +12: [2023-05-13 01:00:15,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +23: [2023-05-13 01:00:15,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt... +23: [2023-05-13 01:00:15,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt... +23: [2023-05-13 01:00:15,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt... +23: [2023-05-13 01:00:15,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt... +23: [2023-05-13 01:00:15,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt... +23: [2023-05-13 01:00:15,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt... +12: [2023-05-13 01:00:15,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +23: [2023-05-13 01:00:15,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt... +23: [2023-05-13 01:00:15,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt... +12: [2023-05-13 01:00:15,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +12: [2023-05-13 01:00:15,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +12: [2023-05-13 01:00:15,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 1: [2023-05-13 01:00:15,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +20: [2023-05-13 01:00:15,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +12: [2023-05-13 01:00:15,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +20: [2023-05-13 01:00:15,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +20: [2023-05-13 01:00:15,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +20: [2023-05-13 01:00:15,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +12: [2023-05-13 01:00:15,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +20: [2023-05-13 01:00:15,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +20: [2023-05-13 01:00:15,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. +20: [2023-05-13 01:00:15,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +16: [2023-05-13 01:00:15,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt... +16: [2023-05-13 01:00:15,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt... +16: [2023-05-13 01:00:15,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt... +20: [2023-05-13 01:00:15,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +16: [2023-05-13 01:00:15,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt... +16: [2023-05-13 01:00:15,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt... +16: [2023-05-13 01:00:15,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt... +20: [2023-05-13 01:00:15,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +20: [2023-05-13 01:00:15,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +20: [2023-05-13 01:00:15,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +20: [2023-05-13 01:00:15,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +20: [2023-05-13 01:00:15,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +20: [2023-05-13 01:00:15,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +24: [2023-05-13 01:00:15,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +24: [2023-05-13 01:00:15,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +19: [2023-05-13 01:00:15,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt... +19: [2023-05-13 01:00:15,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt... +19: [2023-05-13 01:00:15,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt... + 8: [2023-05-13 01:00:15,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +24: [2023-05-13 01:00:15,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +24: [2023-05-13 01:00:15,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +24: [2023-05-13 01:00:15,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_30-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 8: [2023-05-13 01:00:15,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +12: [2023-05-13 01:00:15,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 8: [2023-05-13 01:00:15,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +12: [2023-05-13 01:00:15,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +12: [2023-05-13 01:00:15,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +12: [2023-05-13 01:00:15,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +12: [2023-05-13 01:00:15,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +12: [2023-05-13 01:00:15,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +12: [2023-05-13 01:00:15,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +12: [2023-05-13 01:00:15,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +12: [2023-05-13 01:00:15,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +12: [2023-05-13 01:00:15,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +12: [2023-05-13 01:00:15,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +30: [2023-05-13 01:00:15,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt... +30: [2023-05-13 01:00:15,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt... +30: [2023-05-13 01:00:15,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt... +30: [2023-05-13 01:00:15,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt... + 2: [2023-05-13 01:00:15,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +30: [2023-05-13 01:00:15,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt... +30: [2023-05-13 01:00:15,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt... +30: [2023-05-13 01:00:15,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt... +30: [2023-05-13 01:00:15,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt... + 2: [2023-05-13 01:00:15,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +24: [2023-05-13 01:00:15,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +24: [2023-05-13 01:00:15,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +24: [2023-05-13 01:00:15,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +20: [2023-05-13 01:00:15,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +20: [2023-05-13 01:00:15,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +20: [2023-05-13 01:00:15,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +20: [2023-05-13 01:00:15,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +20: [2023-05-13 01:00:15,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +20: [2023-05-13 01:00:15,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +20: [2023-05-13 01:00:15,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +20: [2023-05-13 01:00:15,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +20: [2023-05-13 01:00:15,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +20: [2023-05-13 01:00:15,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +20: [2023-05-13 01:00:15,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +20: [2023-05-13 01:00:15,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +12: [2023-05-13 01:00:15,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +12: [2023-05-13 01:00:15,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 9: [2023-05-13 01:00:15,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt... + 9: [2023-05-13 01:00:15,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt... + 9: [2023-05-13 01:00:15,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt... + 9: [2023-05-13 01:00:15,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt... + 9: [2023-05-13 01:00:15,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt... + 9: [2023-05-13 01:00:15,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt... + 9: [2023-05-13 01:00:15,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt... + 9: [2023-05-13 01:00:15,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt... +12: [2023-05-13 01:00:15,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +12: [2023-05-13 01:00:15,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +12: [2023-05-13 01:00:15,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +12: [2023-05-13 01:00:15,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +20: [2023-05-13 01:00:15,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +20: [2023-05-13 01:00:15,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +20: [2023-05-13 01:00:15,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +12: [2023-05-13 01:00:15,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +12: [2023-05-13 01:00:15,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... +20: [2023-05-13 01:00:15,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +12: [2023-05-13 01:00:15,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 1: [2023-05-13 01:00:15,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt... + 1: [2023-05-13 01:00:15,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt... + 1: [2023-05-13 01:00:15,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt... + 1: [2023-05-13 01:00:15,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt... + 1: [2023-05-13 01:00:15,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt... + 1: [2023-05-13 01:00:15,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt... + 1: [2023-05-13 01:00:15,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt... + 1: [2023-05-13 01:00:15,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt... + 2: [2023-05-13 01:00:15,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. + 2: [2023-05-13 01:00:15,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt... + 2: [2023-05-13 01:00:15,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/layer_32-model_00-model_states.pt. +22: [2023-05-13 01:00:15,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt... +22: [2023-05-13 01:00:15,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt... +22: [2023-05-13 01:00:15,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt... +22: [2023-05-13 01:00:15,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt... +22: [2023-05-13 01:00:15,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt... +22: [2023-05-13 01:00:15,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt... +22: [2023-05-13 01:00:15,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt... +22: [2023-05-13 01:00:15,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt... + 5: [2023-05-13 01:00:15,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt... + 5: [2023-05-13 01:00:15,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt... + 5: [2023-05-13 01:00:15,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt... + 5: [2023-05-13 01:00:15,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt... + 5: [2023-05-13 01:00:15,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt... + 5: [2023-05-13 01:00:15,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt... + 5: [2023-05-13 01:00:15,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt... + 5: [2023-05-13 01:00:15,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt... +16: [2023-05-13 01:00:15,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt... +16: [2023-05-13 01:00:15,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt... +19: [2023-05-13 01:00:15,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt... +19: [2023-05-13 01:00:15,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt... +19: [2023-05-13 01:00:15,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt... +19: [2023-05-13 01:00:15,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt... +19: [2023-05-13 01:00:15,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt... +31: [2023-05-13 01:00:15,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt... +31: [2023-05-13 01:00:15,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt... +31: [2023-05-13 01:00:15,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt... +31: [2023-05-13 01:00:15,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt... +31: [2023-05-13 01:00:15,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt... +31: [2023-05-13 01:00:15,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt... +31: [2023-05-13 01:00:15,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt... +31: [2023-05-13 01:00:15,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt... +15: [2023-05-13 01:00:15,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt... +15: [2023-05-13 01:00:15,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt... +15: [2023-05-13 01:00:15,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt... +15: [2023-05-13 01:00:15,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt... +15: [2023-05-13 01:00:15,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt... +15: [2023-05-13 01:00:15,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt... +15: [2023-05-13 01:00:15,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt... +15: [2023-05-13 01:00:15,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt... +24: [2023-05-13 01:00:15,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt... +24: [2023-05-13 01:00:15,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt... +24: [2023-05-13 01:00:15,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt... +24: [2023-05-13 01:00:15,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt... +24: [2023-05-13 01:00:15,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt... +24: [2023-05-13 01:00:15,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt... +24: [2023-05-13 01:00:15,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt... +24: [2023-05-13 01:00:15,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt... +12: [2023-05-13 01:00:15,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt... +12: [2023-05-13 01:00:15,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt... +12: [2023-05-13 01:00:15,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt... +12: [2023-05-13 01:00:15,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt... +12: [2023-05-13 01:00:15,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt... +12: [2023-05-13 01:00:15,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt... + 8: [2023-05-13 01:00:15,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt... + 8: [2023-05-13 01:00:15,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt... + 8: [2023-05-13 01:00:15,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt... + 8: [2023-05-13 01:00:15,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt... + 8: [2023-05-13 01:00:15,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt... + 8: [2023-05-13 01:00:15,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt... + 8: [2023-05-13 01:00:15,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt... + 8: [2023-05-13 01:00:15,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt... +20: [2023-05-13 01:00:15,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt... +20: [2023-05-13 01:00:15,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt... +20: [2023-05-13 01:00:15,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt... +20: [2023-05-13 01:00:15,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt... +20: [2023-05-13 01:00:15,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt... +20: [2023-05-13 01:00:15,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt... +20: [2023-05-13 01:00:15,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt... +20: [2023-05-13 01:00:15,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt... +14: [2023-05-13 01:00:15,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt. +14: [2023-05-13 01:00:15,916] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 115 +14: [2023-05-13 01:00:15,921] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 115 + 2: [2023-05-13 01:00:15,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt... + 2: [2023-05-13 01:00:15,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt... + 2: [2023-05-13 01:00:15,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt... + 2: [2023-05-13 01:00:15,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt... + 2: [2023-05-13 01:00:15,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt... + 2: [2023-05-13 01:00:15,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt... + 2: [2023-05-13 01:00:15,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt... + 2: [2023-05-13 01:00:15,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt... +14: [2023-05-13 01:00:15,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt. +14: [2023-05-13 01:00:15,924] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 114 +14: [2023-05-13 01:00:15,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt. +14: [2023-05-13 01:00:15,925] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 112 +14: [2023-05-13 01:00:15,928] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 114 +14: [2023-05-13 01:00:15,929] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 112 +12: [2023-05-13 01:00:15,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt... +12: [2023-05-13 01:00:15,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt... +14: [2023-05-13 01:00:15,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt. +14: [2023-05-13 01:00:15,947] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 117 +14: [2023-05-13 01:00:15,952] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 117 +27: [2023-05-13 01:00:15,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt. +27: [2023-05-13 01:00:15,964] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 221 + 7: [2023-05-13 01:00:15,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt. + 7: [2023-05-13 01:00:15,967] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 59 +27: [2023-05-13 01:00:15,968] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 221 + 7: [2023-05-13 01:00:15,970] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 59 +14: [2023-05-13 01:00:15,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt. +14: [2023-05-13 01:00:15,976] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 119 +10: [2023-05-13 01:00:15,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt. +10: [2023-05-13 01:00:15,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt. +10: [2023-05-13 01:00:15,980] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 87 +10: [2023-05-13 01:00:15,980] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 85 +14: [2023-05-13 01:00:15,980] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 119 +10: [2023-05-13 01:00:15,984] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 87 +10: [2023-05-13 01:00:15,984] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 85 + 7: [2023-05-13 01:00:15,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt. + 7: [2023-05-13 01:00:15,996] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 61 + 7: [2023-05-13 01:00:16,001] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 61 +27: [2023-05-13 01:00:16,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt. +27: [2023-05-13 01:00:16,004] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 216 +27: [2023-05-13 01:00:16,008] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 216 +26: [2023-05-13 01:00:16,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt. +26: [2023-05-13 01:00:16,012] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 210 +27: [2023-05-13 01:00:16,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt. +27: [2023-05-13 01:00:16,013] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 217 +27: [2023-05-13 01:00:16,017] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 217 +26: [2023-05-13 01:00:16,017] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 210 +17: [2023-05-13 01:00:16,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt. +17: [2023-05-13 01:00:16,022] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 138 +17: [2023-05-13 01:00:16,026] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 138 +14: [2023-05-13 01:00:16,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt. +14: [2023-05-13 01:00:16,035] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 118 +11: [2023-05-13 01:00:16,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt. +11: [2023-05-13 01:00:16,036] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 90 +14: [2023-05-13 01:00:16,039] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 118 +11: [2023-05-13 01:00:16,040] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 90 +10: [2023-05-13 01:00:16,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt. +10: [2023-05-13 01:00:16,043] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 82 +10: [2023-05-13 01:00:16,047] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 82 + 7: [2023-05-13 01:00:16,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt. + 7: [2023-05-13 01:00:16,051] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 57 + 7: [2023-05-13 01:00:16,055] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 57 +26: [2023-05-13 01:00:16,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt. +26: [2023-05-13 01:00:16,058] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 208 +26: [2023-05-13 01:00:16,064] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 208 + 7: [2023-05-13 01:00:16,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt. +26: [2023-05-13 01:00:16,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt. +26: [2023-05-13 01:00:16,075] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 215 + 7: [2023-05-13 01:00:16,075] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 63 +10: [2023-05-13 01:00:16,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt. +10: [2023-05-13 01:00:16,078] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 84 +26: [2023-05-13 01:00:16,079] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 215 + 7: [2023-05-13 01:00:16,079] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 63 +26: [2023-05-13 01:00:16,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt. +26: [2023-05-13 01:00:16,080] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 211 +10: [2023-05-13 01:00:16,083] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 84 +25: [2023-05-13 01:00:16,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt. +25: [2023-05-13 01:00:16,083] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 206 +18: [2023-05-13 01:00:16,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt. +27: [2023-05-13 01:00:16,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt. +27: [2023-05-13 01:00:16,084] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 223 +18: [2023-05-13 01:00:16,084] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 148 +26: [2023-05-13 01:00:16,085] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 211 + 6: [2023-05-13 01:00:16,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt. + 7: [2023-05-13 01:00:16,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt. +17: [2023-05-13 01:00:16,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt. + 6: [2023-05-13 01:00:16,086] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 52 + 7: [2023-05-13 01:00:16,087] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 60 +17: [2023-05-13 01:00:16,087] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 137 +25: [2023-05-13 01:00:16,088] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 206 +18: [2023-05-13 01:00:16,088] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 148 +27: [2023-05-13 01:00:16,088] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 223 +27: [2023-05-13 01:00:16,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt. +27: [2023-05-13 01:00:16,089] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 218 + 6: [2023-05-13 01:00:16,090] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 52 +17: [2023-05-13 01:00:16,091] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 137 + 7: [2023-05-13 01:00:16,091] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 60 +27: [2023-05-13 01:00:16,093] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 218 + 7: [2023-05-13 01:00:16,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt. +27: [2023-05-13 01:00:16,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt. +27: [2023-05-13 01:00:16,093] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 219 + 7: [2023-05-13 01:00:16,094] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 58 +26: [2023-05-13 01:00:16,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt. +26: [2023-05-13 01:00:16,095] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 214 +21: [2023-05-13 01:00:16,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt. +21: [2023-05-13 01:00:16,097] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 175 +27: [2023-05-13 01:00:16,097] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 219 + 7: [2023-05-13 01:00:16,098] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 58 +26: [2023-05-13 01:00:16,099] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 214 +21: [2023-05-13 01:00:16,101] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 175 +11: [2023-05-13 01:00:16,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt. +11: [2023-05-13 01:00:16,104] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 92 +17: [2023-05-13 01:00:16,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt. +27: [2023-05-13 01:00:16,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt. +27: [2023-05-13 01:00:16,107] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 222 +14: [2023-05-13 01:00:16,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt. +17: [2023-05-13 01:00:16,107] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 141 +17: [2023-05-13 01:00:16,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt. +14: [2023-05-13 01:00:16,108] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 113 +17: [2023-05-13 01:00:16,108] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 143 +11: [2023-05-13 01:00:16,109] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 92 +27: [2023-05-13 01:00:16,111] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 222 + 6: [2023-05-13 01:00:16,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt. + 6: [2023-05-13 01:00:16,112] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 48 +14: [2023-05-13 01:00:16,113] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 113 +17: [2023-05-13 01:00:16,111] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 141 +17: [2023-05-13 01:00:16,112] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 143 +13: [2023-05-13 01:00:16,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt. + 6: [2023-05-13 01:00:16,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt. + 6: [2023-05-13 01:00:16,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt. +13: [2023-05-13 01:00:16,116] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 110 + 6: [2023-05-13 01:00:16,116] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 48 + 6: [2023-05-13 01:00:16,117] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 50 + 6: [2023-05-13 01:00:16,117] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 55 +18: [2023-05-13 01:00:16,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt. +18: [2023-05-13 01:00:16,120] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 144 + 6: [2023-05-13 01:00:16,120] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 55 +13: [2023-05-13 01:00:16,120] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 110 + 6: [2023-05-13 01:00:16,120] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 50 +18: [2023-05-13 01:00:16,123] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 144 +17: [2023-05-13 01:00:16,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt. +17: [2023-05-13 01:00:16,124] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 136 + 0: [2023-05-13 01:00:16,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt. + 0: [2023-05-13 01:00:16,126] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 2 +25: [2023-05-13 01:00:16,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt. +25: [2023-05-13 01:00:16,127] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 203 +17: [2023-05-13 01:00:16,129] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 136 + 0: [2023-05-13 01:00:16,130] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 2 +25: [2023-05-13 01:00:16,131] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 203 + 7: [2023-05-13 01:00:16,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt. + 7: [2023-05-13 01:00:16,132] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 62 +19: [2023-05-13 01:00:16,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt. + 6: [2023-05-13 01:00:16,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt. +19: [2023-05-13 01:00:16,133] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 159 + 6: [2023-05-13 01:00:16,134] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 51 +16: [2023-05-13 01:00:16,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt. +16: [2023-05-13 01:00:16,135] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 135 + 7: [2023-05-13 01:00:16,136] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 62 +26: [2023-05-13 01:00:16,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt. +26: [2023-05-13 01:00:16,138] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 209 + 6: [2023-05-13 01:00:16,138] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 51 +19: [2023-05-13 01:00:16,138] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 159 +18: [2023-05-13 01:00:16,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt. +18: [2023-05-13 01:00:16,141] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 145 +26: [2023-05-13 01:00:16,141] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 209 +16: [2023-05-13 01:00:16,140] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 135 +18: [2023-05-13 01:00:16,145] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 145 + 0: [2023-05-13 01:00:16,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt. + 0: [2023-05-13 01:00:16,149] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 7 + 0: [2023-05-13 01:00:16,153] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 7 +18: [2023-05-13 01:00:16,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt. +18: [2023-05-13 01:00:16,155] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 149 +10: [2023-05-13 01:00:16,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt. +10: [2023-05-13 01:00:16,155] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 86 +13: [2023-05-13 01:00:16,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt. +13: [2023-05-13 01:00:16,156] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 109 + 0: [2023-05-13 01:00:16,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt. +18: [2023-05-13 01:00:16,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt. +18: [2023-05-13 01:00:16,158] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 149 +18: [2023-05-13 01:00:16,159] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 147 + 0: [2023-05-13 01:00:16,159] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 6 +19: [2023-05-13 01:00:16,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt. +13: [2023-05-13 01:00:16,160] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 109 +19: [2023-05-13 01:00:16,160] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 154 +10: [2023-05-13 01:00:16,161] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 86 +10: [2023-05-13 01:00:16,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt. + 0: [2023-05-13 01:00:16,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt. +10: [2023-05-13 01:00:16,162] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 80 +18: [2023-05-13 01:00:16,162] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 147 + 0: [2023-05-13 01:00:16,162] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 0 + 0: [2023-05-13 01:00:16,163] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 6 +19: [2023-05-13 01:00:16,164] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 154 +23: [2023-05-13 01:00:16,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt. +23: [2023-05-13 01:00:16,166] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 190 +10: [2023-05-13 01:00:16,166] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 80 + 0: [2023-05-13 01:00:16,166] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 0 +23: [2023-05-13 01:00:16,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt. +11: [2023-05-13 01:00:16,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt. +23: [2023-05-13 01:00:16,168] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 191 + 0: could not find arguments in the checkpoint ... + 0: checkpoint version 3.0 +11: [2023-05-13 01:00:16,169] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 88 +23: [2023-05-13 01:00:16,170] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 190 +28: [2023-05-13 01:00:16,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt. +11: [2023-05-13 01:00:16,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt. +28: [2023-05-13 01:00:16,170] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 224 +18: [2023-05-13 01:00:16,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt. +18: [2023-05-13 01:00:16,171] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 151 +11: [2023-05-13 01:00:16,171] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 89 +28: [2023-05-13 01:00:16,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt. +28: [2023-05-13 01:00:16,172] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 231 +11: [2023-05-13 01:00:16,173] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 88 +23: [2023-05-13 01:00:16,173] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 191 +21: [2023-05-13 01:00:16,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt. +25: [2023-05-13 01:00:16,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt. +25: [2023-05-13 01:00:16,175] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 204 +21: [2023-05-13 01:00:16,175] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 169 +28: [2023-05-13 01:00:16,175] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 224 +18: [2023-05-13 01:00:16,175] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 151 +11: [2023-05-13 01:00:16,175] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 89 +28: [2023-05-13 01:00:16,176] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 231 +18: [2023-05-13 01:00:16,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt. +25: [2023-05-13 01:00:16,178] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 204 +18: [2023-05-13 01:00:16,178] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 146 +21: [2023-05-13 01:00:16,178] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 169 + 7: [2023-05-13 01:00:16,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt. + 7: [2023-05-13 01:00:16,180] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 56 +18: [2023-05-13 01:00:16,182] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 146 + 9: [2023-05-13 01:00:16,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt. + 9: [2023-05-13 01:00:16,183] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 73 + 7: [2023-05-13 01:00:16,184] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 56 +17: [2023-05-13 01:00:16,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt. +20: [2023-05-13 01:00:16,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt. +28: [2023-05-13 01:00:16,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt. +20: [2023-05-13 01:00:16,186] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 166 +28: [2023-05-13 01:00:16,187] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 227 +17: [2023-05-13 01:00:16,186] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 142 +18: [2023-05-13 01:00:16,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt. +15: [2023-05-13 01:00:16,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt. + 9: [2023-05-13 01:00:16,187] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 73 +18: [2023-05-13 01:00:16,187] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 150 +15: [2023-05-13 01:00:16,187] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 120 +26: [2023-05-13 01:00:16,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt. +26: [2023-05-13 01:00:16,189] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 213 + 3: [2023-05-13 01:00:16,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt. + 3: [2023-05-13 01:00:16,190] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 26 + 3: [2023-05-13 01:00:16,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt. +17: [2023-05-13 01:00:16,190] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 142 + 3: [2023-05-13 01:00:16,191] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 28 +18: [2023-05-13 01:00:16,191] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 150 +28: [2023-05-13 01:00:16,191] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 227 +15: [2023-05-13 01:00:16,191] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 120 +20: [2023-05-13 01:00:16,191] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 166 +19: [2023-05-13 01:00:16,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt. +19: [2023-05-13 01:00:16,192] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 153 +26: [2023-05-13 01:00:16,193] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 213 +11: [2023-05-13 01:00:16,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt. + 3: [2023-05-13 01:00:16,194] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 26 +11: [2023-05-13 01:00:16,194] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 93 + 3: [2023-05-13 01:00:16,195] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 28 + 4: [2023-05-13 01:00:16,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt. + 4: [2023-05-13 01:00:16,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt. +19: [2023-05-13 01:00:16,196] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 153 + 4: [2023-05-13 01:00:16,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt. + 4: [2023-05-13 01:00:16,197] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 34 + 4: [2023-05-13 01:00:16,197] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 35 +11: [2023-05-13 01:00:16,197] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 93 + 4: [2023-05-13 01:00:16,197] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 38 +22: [2023-05-13 01:00:16,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt. +22: [2023-05-13 01:00:16,198] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 176 + 3: [2023-05-13 01:00:16,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt. +25: [2023-05-13 01:00:16,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt. +25: [2023-05-13 01:00:16,200] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 202 + 3: [2023-05-13 01:00:16,201] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 24 + 4: [2023-05-13 01:00:16,201] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 35 + 4: [2023-05-13 01:00:16,201] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 34 +29: [2023-05-13 01:00:16,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt. + 4: [2023-05-13 01:00:16,201] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 38 +29: [2023-05-13 01:00:16,202] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 237 + 2: [2023-05-13 01:00:16,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt. +22: [2023-05-13 01:00:16,202] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 176 + 2: [2023-05-13 01:00:16,203] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 23 +25: [2023-05-13 01:00:16,203] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 202 +25: [2023-05-13 01:00:16,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt. +25: [2023-05-13 01:00:16,204] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 200 + 3: [2023-05-13 01:00:16,205] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 24 +29: [2023-05-13 01:00:16,206] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 237 + 3: [2023-05-13 01:00:16,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt. + 3: [2023-05-13 01:00:16,207] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 31 + 4: [2023-05-13 01:00:16,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt. + 5: [2023-05-13 01:00:16,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt. + 2: [2023-05-13 01:00:16,207] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 23 +25: [2023-05-13 01:00:16,207] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 200 + 4: [2023-05-13 01:00:16,207] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 33 + 5: [2023-05-13 01:00:16,208] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 42 +21: [2023-05-13 01:00:16,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt. +11: [2023-05-13 01:00:16,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt. +21: [2023-05-13 01:00:16,209] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 171 +11: [2023-05-13 01:00:16,209] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 95 +16: [2023-05-13 01:00:16,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt. +29: [2023-05-13 01:00:16,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt. +29: [2023-05-13 01:00:16,210] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 233 +16: [2023-05-13 01:00:16,210] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 133 +22: [2023-05-13 01:00:16,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt. + 3: [2023-05-13 01:00:16,210] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 31 +22: [2023-05-13 01:00:16,210] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 183 + 4: [2023-05-13 01:00:16,211] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 33 + 5: [2023-05-13 01:00:16,211] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 42 +13: [2023-05-13 01:00:16,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt. +13: [2023-05-13 01:00:16,212] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 106 +21: [2023-05-13 01:00:16,213] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 171 +11: [2023-05-13 01:00:16,213] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 95 +16: [2023-05-13 01:00:16,213] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 133 +29: [2023-05-13 01:00:16,214] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 233 +22: [2023-05-13 01:00:16,214] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 183 +13: [2023-05-13 01:00:16,216] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 106 +21: [2023-05-13 01:00:16,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt. +21: [2023-05-13 01:00:16,216] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 168 + 0: [2023-05-13 01:00:16,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt. + 0: [2023-05-13 01:00:16,217] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 5 +21: [2023-05-13 01:00:16,220] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 168 + 0: [2023-05-13 01:00:16,220] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 5 +24: [2023-05-13 01:00:16,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt. +24: [2023-05-13 01:00:16,221] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 198 +25: [2023-05-13 01:00:16,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt. +25: [2023-05-13 01:00:16,222] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 201 +27: [2023-05-13 01:00:16,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt. +27: [2023-05-13 01:00:16,223] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 220 + 9: [2023-05-13 01:00:16,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt. + 6: [2023-05-13 01:00:16,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt. + 9: [2023-05-13 01:00:16,224] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 79 + 6: [2023-05-13 01:00:16,224] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 49 + 3: [2023-05-13 01:00:16,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt. + 3: [2023-05-13 01:00:16,226] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 27 +24: [2023-05-13 01:00:16,226] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 198 +10: [2023-05-13 01:00:16,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt. +25: [2023-05-13 01:00:16,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt. +25: [2023-05-13 01:00:16,226] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 207 +10: [2023-05-13 01:00:16,226] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 81 +25: [2023-05-13 01:00:16,226] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 201 +27: [2023-05-13 01:00:16,227] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 220 +25: [2023-05-13 01:00:16,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt. +25: [2023-05-13 01:00:16,227] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 205 +10: [2023-05-13 01:00:16,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt. + 6: [2023-05-13 01:00:16,228] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 49 +10: [2023-05-13 01:00:16,228] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 83 + 9: [2023-05-13 01:00:16,228] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 79 +17: [2023-05-13 01:00:16,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt. +17: [2023-05-13 01:00:16,228] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 140 + 3: [2023-05-13 01:00:16,229] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 27 +10: [2023-05-13 01:00:16,230] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 81 +25: [2023-05-13 01:00:16,230] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 205 +25: [2023-05-13 01:00:16,230] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 207 +16: [2023-05-13 01:00:16,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt. +16: [2023-05-13 01:00:16,231] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 130 +10: [2023-05-13 01:00:16,231] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 83 +11: [2023-05-13 01:00:16,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt. + 4: [2023-05-13 01:00:16,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt. +11: [2023-05-13 01:00:16,232] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 94 + 4: [2023-05-13 01:00:16,232] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 32 +17: [2023-05-13 01:00:16,232] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 140 + 6: [2023-05-13 01:00:16,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt. + 6: [2023-05-13 01:00:16,234] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 54 +19: [2023-05-13 01:00:16,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt. +16: [2023-05-13 01:00:16,235] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 130 +19: [2023-05-13 01:00:16,235] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 152 + 4: [2023-05-13 01:00:16,236] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 32 + 3: [2023-05-13 01:00:16,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt. +31: [2023-05-13 01:00:16,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt. +31: [2023-05-13 01:00:16,236] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 255 + 3: [2023-05-13 01:00:16,237] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 29 +11: [2023-05-13 01:00:16,237] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 94 + 0: [2023-05-13 01:00:16,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt. + 0: [2023-05-13 01:00:16,238] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 3 + 6: [2023-05-13 01:00:16,238] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 54 + 8: [2023-05-13 01:00:16,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt. + 8: [2023-05-13 01:00:16,239] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 64 +31: [2023-05-13 01:00:16,239] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 255 + 9: [2023-05-13 01:00:16,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt. +19: [2023-05-13 01:00:16,239] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 152 + 9: [2023-05-13 01:00:16,240] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 74 + 3: [2023-05-13 01:00:16,241] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 29 + 4: [2023-05-13 01:00:16,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt. + 0: [2023-05-13 01:00:16,242] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 3 + 4: [2023-05-13 01:00:16,242] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 39 +16: [2023-05-13 01:00:16,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt. +29: [2023-05-13 01:00:16,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt. +29: [2023-05-13 01:00:16,243] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 239 + 8: [2023-05-13 01:00:16,243] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 64 +16: [2023-05-13 01:00:16,243] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 129 + 9: [2023-05-13 01:00:16,243] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 74 +16: [2023-05-13 01:00:16,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt. +16: [2023-05-13 01:00:16,244] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 131 + 4: [2023-05-13 01:00:16,245] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 39 + 5: [2023-05-13 01:00:16,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt. + 5: [2023-05-13 01:00:16,247] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 46 + 9: [2023-05-13 01:00:16,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt. +29: [2023-05-13 01:00:16,248] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 239 + 9: [2023-05-13 01:00:16,247] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 77 +16: [2023-05-13 01:00:16,248] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 129 +16: [2023-05-13 01:00:16,248] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 131 +31: [2023-05-13 01:00:16,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt. +31: [2023-05-13 01:00:16,249] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 251 +31: [2023-05-13 01:00:16,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt. +31: [2023-05-13 01:00:16,249] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 250 +29: [2023-05-13 01:00:16,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt. +16: [2023-05-13 01:00:16,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt. +29: [2023-05-13 01:00:16,250] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 236 +16: [2023-05-13 01:00:16,250] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 132 + 5: [2023-05-13 01:00:16,251] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 46 + 9: [2023-05-13 01:00:16,251] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 77 +13: [2023-05-13 01:00:16,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt. +13: [2023-05-13 01:00:16,252] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 105 + 0: [2023-05-13 01:00:16,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt. +16: [2023-05-13 01:00:16,254] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 132 +29: [2023-05-13 01:00:16,254] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 236 +31: [2023-05-13 01:00:16,254] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 251 + 0: [2023-05-13 01:00:16,254] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 1 +31: [2023-05-13 01:00:16,254] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 250 + 3: [2023-05-13 01:00:16,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt. + 3: [2023-05-13 01:00:16,255] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 30 + 1: [2023-05-13 01:00:16,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt. +20: [2023-05-13 01:00:16,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt. + 1: [2023-05-13 01:00:16,256] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 11 +30: [2023-05-13 01:00:16,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt. +20: [2023-05-13 01:00:16,256] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 165 +13: [2023-05-13 01:00:16,256] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 105 +30: [2023-05-13 01:00:16,256] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 240 + 1: [2023-05-13 01:00:16,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt. + 1: [2023-05-13 01:00:16,257] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 15 +28: [2023-05-13 01:00:16,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt. +28: [2023-05-13 01:00:16,258] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 226 + 0: [2023-05-13 01:00:16,258] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 1 + 3: [2023-05-13 01:00:16,259] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 30 + 1: [2023-05-13 01:00:16,260] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 11 +15: [2023-05-13 01:00:16,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt. +30: [2023-05-13 01:00:16,261] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 240 +15: [2023-05-13 01:00:16,261] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 127 +20: [2023-05-13 01:00:16,260] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 165 +29: [2023-05-13 01:00:16,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt. +29: [2023-05-13 01:00:16,261] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 238 + 1: [2023-05-13 01:00:16,261] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 15 +28: [2023-05-13 01:00:16,262] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 226 +23: [2023-05-13 01:00:16,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt. +23: [2023-05-13 01:00:16,263] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 188 +31: [2023-05-13 01:00:16,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt. +31: [2023-05-13 01:00:16,263] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 254 +23: [2023-05-13 01:00:16,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt. +23: [2023-05-13 01:00:16,264] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 189 + 5: [2023-05-13 01:00:16,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt. +15: [2023-05-13 01:00:16,265] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 127 + 5: [2023-05-13 01:00:16,265] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 40 +29: [2023-05-13 01:00:16,266] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 238 +28: [2023-05-13 01:00:16,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt. +28: [2023-05-13 01:00:16,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt. +28: [2023-05-13 01:00:16,267] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 228 +28: [2023-05-13 01:00:16,267] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 225 +23: [2023-05-13 01:00:16,267] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 188 +31: [2023-05-13 01:00:16,267] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 254 + 5: [2023-05-13 01:00:16,269] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 40 +23: [2023-05-13 01:00:16,268] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 189 +17: [2023-05-13 01:00:16,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt. +17: [2023-05-13 01:00:16,269] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 139 +29: [2023-05-13 01:00:16,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt. +29: [2023-05-13 01:00:16,271] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 234 +11: [2023-05-13 01:00:16,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt. +15: [2023-05-13 01:00:16,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt. +17: [2023-05-13 01:00:16,273] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 139 +11: [2023-05-13 01:00:16,273] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 91 +28: [2023-05-13 01:00:16,273] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 228 +28: [2023-05-13 01:00:16,273] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 225 +15: [2023-05-13 01:00:16,273] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 121 +13: [2023-05-13 01:00:16,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt. + 1: [2023-05-13 01:00:16,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt. +13: [2023-05-13 01:00:16,274] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 104 + 1: [2023-05-13 01:00:16,274] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 10 +29: [2023-05-13 01:00:16,275] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 234 +22: [2023-05-13 01:00:16,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt. +22: [2023-05-13 01:00:16,275] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 179 +15: [2023-05-13 01:00:16,276] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 121 +11: [2023-05-13 01:00:16,277] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 91 +22: [2023-05-13 01:00:16,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt. +22: [2023-05-13 01:00:16,277] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 178 +13: [2023-05-13 01:00:16,278] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 104 + 1: [2023-05-13 01:00:16,278] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 10 +30: [2023-05-13 01:00:16,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt. +30: [2023-05-13 01:00:16,279] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 244 +22: [2023-05-13 01:00:16,281] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 179 +23: [2023-05-13 01:00:16,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt. +22: [2023-05-13 01:00:16,281] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 178 +23: [2023-05-13 01:00:16,281] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 186 +22: [2023-05-13 01:00:16,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt. +22: [2023-05-13 01:00:16,282] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 177 + 4: [2023-05-13 01:00:16,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt. +30: [2023-05-13 01:00:16,283] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 244 + 4: [2023-05-13 01:00:16,283] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 36 +30: [2023-05-13 01:00:16,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt. +30: [2023-05-13 01:00:16,284] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 246 +15: [2023-05-13 01:00:16,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt. +15: [2023-05-13 01:00:16,285] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 124 +22: [2023-05-13 01:00:16,285] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 177 +23: [2023-05-13 01:00:16,285] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 186 + 4: [2023-05-13 01:00:16,287] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 36 +30: [2023-05-13 01:00:16,288] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 246 +19: [2023-05-13 01:00:16,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt. +31: [2023-05-13 01:00:16,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt. +31: [2023-05-13 01:00:16,288] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 249 +19: [2023-05-13 01:00:16,288] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 158 +15: [2023-05-13 01:00:16,289] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 124 + 1: [2023-05-13 01:00:16,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt. + 1: [2023-05-13 01:00:16,290] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 8 + 1: [2023-05-13 01:00:16,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt. + 1: [2023-05-13 01:00:16,291] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 9 +31: [2023-05-13 01:00:16,292] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 249 +12: [2023-05-13 01:00:16,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt. +15: [2023-05-13 01:00:16,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt. +19: [2023-05-13 01:00:16,293] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 158 +12: [2023-05-13 01:00:16,293] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 102 +15: [2023-05-13 01:00:16,293] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 125 +16: [2023-05-13 01:00:16,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt. +16: [2023-05-13 01:00:16,293] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 128 +31: [2023-05-13 01:00:16,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt. +31: [2023-05-13 01:00:16,294] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 248 + 1: [2023-05-13 01:00:16,294] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 8 + 1: [2023-05-13 01:00:16,296] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 9 +15: [2023-05-13 01:00:16,297] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 125 +12: [2023-05-13 01:00:16,297] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 102 +31: [2023-05-13 01:00:16,297] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 248 +16: [2023-05-13 01:00:16,298] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 128 +24: [2023-05-13 01:00:16,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt. +24: [2023-05-13 01:00:16,302] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 194 +21: [2023-05-13 01:00:16,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt. +21: [2023-05-13 01:00:16,303] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 173 +30: [2023-05-13 01:00:16,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt. +30: [2023-05-13 01:00:16,304] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 243 + 1: [2023-05-13 01:00:16,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt. + 1: [2023-05-13 01:00:16,305] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 12 +24: [2023-05-13 01:00:16,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt. +24: [2023-05-13 01:00:16,305] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 193 +30: [2023-05-13 01:00:16,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt. +30: [2023-05-13 01:00:16,306] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 247 +24: [2023-05-13 01:00:16,306] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 194 +21: [2023-05-13 01:00:16,307] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 173 + 3: [2023-05-13 01:00:16,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt. +30: [2023-05-13 01:00:16,308] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 243 +28: [2023-05-13 01:00:16,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt. + 5: [2023-05-13 01:00:16,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt. +28: [2023-05-13 01:00:16,308] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 230 + 3: [2023-05-13 01:00:16,308] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 25 + 5: [2023-05-13 01:00:16,309] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 47 +24: [2023-05-13 01:00:16,308] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 193 + 1: [2023-05-13 01:00:16,309] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 12 +30: [2023-05-13 01:00:16,310] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 247 +19: [2023-05-13 01:00:16,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt. +19: [2023-05-13 01:00:16,311] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 155 + 3: [2023-05-13 01:00:16,311] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 25 +28: [2023-05-13 01:00:16,312] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 230 +12: [2023-05-13 01:00:16,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt. + 5: [2023-05-13 01:00:16,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt. +12: [2023-05-13 01:00:16,312] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 96 + 5: [2023-05-13 01:00:16,313] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 47 +15: [2023-05-13 01:00:16,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt. + 5: [2023-05-13 01:00:16,313] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 43 + 2: [2023-05-13 01:00:16,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt. +15: [2023-05-13 01:00:16,313] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 123 + 2: [2023-05-13 01:00:16,314] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 17 +22: [2023-05-13 01:00:16,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt. +21: [2023-05-13 01:00:16,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt. +22: [2023-05-13 01:00:16,314] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 181 +21: [2023-05-13 01:00:16,315] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 172 +16: [2023-05-13 01:00:16,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt. +16: [2023-05-13 01:00:16,315] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 134 +12: [2023-05-13 01:00:16,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt. +19: [2023-05-13 01:00:16,315] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 155 +12: [2023-05-13 01:00:16,316] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 103 +12: [2023-05-13 01:00:16,316] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 96 + 6: [2023-05-13 01:00:16,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt. +24: [2023-05-13 01:00:16,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt. + 5: [2023-05-13 01:00:16,317] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 43 +15: [2023-05-13 01:00:16,317] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 123 +24: [2023-05-13 01:00:16,317] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 196 + 6: [2023-05-13 01:00:16,318] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 53 +22: [2023-05-13 01:00:16,318] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 181 +21: [2023-05-13 01:00:16,318] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 172 + 2: [2023-05-13 01:00:16,319] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 17 +13: [2023-05-13 01:00:16,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt. +12: [2023-05-13 01:00:16,320] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 103 +13: [2023-05-13 01:00:16,320] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 111 +16: [2023-05-13 01:00:16,319] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 134 +22: [2023-05-13 01:00:16,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt. + 6: [2023-05-13 01:00:16,321] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 53 +24: [2023-05-13 01:00:16,321] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 196 +22: [2023-05-13 01:00:16,321] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 180 +12: [2023-05-13 01:00:16,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt. +12: [2023-05-13 01:00:16,322] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 97 + 1: [2023-05-13 01:00:16,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt. + 1: [2023-05-13 01:00:16,323] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 13 +13: [2023-05-13 01:00:16,324] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 111 +22: [2023-05-13 01:00:16,324] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 180 +15: [2023-05-13 01:00:16,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt. +15: [2023-05-13 01:00:16,326] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 126 +12: [2023-05-13 01:00:16,326] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 97 + 1: [2023-05-13 01:00:16,327] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 13 +20: [2023-05-13 01:00:16,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt. +20: [2023-05-13 01:00:16,328] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 162 +15: [2023-05-13 01:00:16,330] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 126 + 1: [2023-05-13 01:00:16,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt. +12: [2023-05-13 01:00:16,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt. + 1: [2023-05-13 01:00:16,332] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 14 +12: [2023-05-13 01:00:16,332] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 98 +20: [2023-05-13 01:00:16,333] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 162 + 1: [2023-05-13 01:00:16,335] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 14 + 0: [2023-05-13 01:00:16,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt. + 8: [2023-05-13 01:00:16,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt. + 8: [2023-05-13 01:00:16,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt. +12: [2023-05-13 01:00:16,336] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 98 + 0: [2023-05-13 01:00:16,337] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 4 + 8: [2023-05-13 01:00:16,337] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 69 + 8: [2023-05-13 01:00:16,337] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 65 +12: [2023-05-13 01:00:16,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt. +12: [2023-05-13 01:00:16,339] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 101 + 0: [2023-05-13 01:00:16,340] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 4 + 8: [2023-05-13 01:00:16,340] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 69 + 8: [2023-05-13 01:00:16,341] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 65 +12: [2023-05-13 01:00:16,342] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 101 +24: [2023-05-13 01:00:16,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt. +24: [2023-05-13 01:00:16,346] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 197 +30: [2023-05-13 01:00:16,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt. +30: [2023-05-13 01:00:16,348] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 245 +23: [2023-05-13 01:00:16,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt. +23: [2023-05-13 01:00:16,349] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 184 +24: [2023-05-13 01:00:16,350] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 197 +30: [2023-05-13 01:00:16,352] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 245 +23: [2023-05-13 01:00:16,353] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 184 +29: [2023-05-13 01:00:16,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt. +29: [2023-05-13 01:00:16,354] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 235 +19: [2023-05-13 01:00:16,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt. +19: [2023-05-13 01:00:16,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt. +19: [2023-05-13 01:00:16,355] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 156 +19: [2023-05-13 01:00:16,355] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 157 + 2: [2023-05-13 01:00:16,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt. + 2: [2023-05-13 01:00:16,357] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 21 +29: [2023-05-13 01:00:16,358] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 235 +23: [2023-05-13 01:00:16,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt. +23: [2023-05-13 01:00:16,359] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 185 +30: [2023-05-13 01:00:16,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt. +30: [2023-05-13 01:00:16,359] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 241 +19: [2023-05-13 01:00:16,360] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 157 +19: [2023-05-13 01:00:16,360] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 156 + 2: [2023-05-13 01:00:16,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt. + 2: [2023-05-13 01:00:16,361] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 21 + 8: [2023-05-13 01:00:16,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt. + 2: [2023-05-13 01:00:16,361] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 16 +24: [2023-05-13 01:00:16,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt. + 8: [2023-05-13 01:00:16,362] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 67 +24: [2023-05-13 01:00:16,362] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 192 +30: [2023-05-13 01:00:16,363] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 241 +23: [2023-05-13 01:00:16,363] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 185 + 5: [2023-05-13 01:00:16,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt. + 8: [2023-05-13 01:00:16,365] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 67 + 5: [2023-05-13 01:00:16,365] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 41 + 2: [2023-05-13 01:00:16,366] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 16 +24: [2023-05-13 01:00:16,366] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 192 +22: [2023-05-13 01:00:16,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt. +22: [2023-05-13 01:00:16,368] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 182 + 8: [2023-05-13 01:00:16,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt. + 5: [2023-05-13 01:00:16,369] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 41 + 8: [2023-05-13 01:00:16,370] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 71 +20: [2023-05-13 01:00:16,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt. +20: [2023-05-13 01:00:16,371] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 163 +22: [2023-05-13 01:00:16,371] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 182 + 8: [2023-05-13 01:00:16,373] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 71 +24: [2023-05-13 01:00:16,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt. +24: [2023-05-13 01:00:16,374] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 195 +20: [2023-05-13 01:00:16,374] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 163 + 8: [2023-05-13 01:00:16,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt. +24: [2023-05-13 01:00:16,377] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 195 + 8: [2023-05-13 01:00:16,377] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 70 + 2: [2023-05-13 01:00:16,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt. + 2: [2023-05-13 01:00:16,379] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 18 + 9: [2023-05-13 01:00:16,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt. + 9: [2023-05-13 01:00:16,381] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 75 + 8: [2023-05-13 01:00:16,381] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 70 + 2: [2023-05-13 01:00:16,382] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 18 +20: [2023-05-13 01:00:16,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt. +20: [2023-05-13 01:00:16,383] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 164 + 9: [2023-05-13 01:00:16,384] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 75 +31: [2023-05-13 01:00:16,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt. +31: [2023-05-13 01:00:16,386] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 252 +20: [2023-05-13 01:00:16,387] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 164 + 2: [2023-05-13 01:00:16,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt. + 2: [2023-05-13 01:00:16,388] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 19 +31: [2023-05-13 01:00:16,390] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 252 + 2: [2023-05-13 01:00:16,392] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 19 + 4: [2023-05-13 01:00:16,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt. + 4: [2023-05-13 01:00:16,393] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 37 + 2: [2023-05-13 01:00:16,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt. + 2: [2023-05-13 01:00:16,397] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 22 + 4: [2023-05-13 01:00:16,397] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 37 + 2: [2023-05-13 01:00:16,401] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 22 +20: [2023-05-13 01:00:16,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt. +20: [2023-05-13 01:00:16,407] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 161 +20: [2023-05-13 01:00:16,410] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 161 +31: [2023-05-13 01:00:16,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt. +31: [2023-05-13 01:00:16,412] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 253 +31: [2023-05-13 01:00:16,415] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 253 + 5: [2023-05-13 01:00:16,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt. + 5: [2023-05-13 01:00:16,417] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 44 + 5: [2023-05-13 01:00:16,421] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 44 +24: [2023-05-13 01:00:16,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt. +24: [2023-05-13 01:00:16,422] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 199 +24: [2023-05-13 01:00:16,426] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 199 +20: [2023-05-13 01:00:16,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt. +20: [2023-05-13 01:00:16,433] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 160 +21: [2023-05-13 01:00:16,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt. +21: [2023-05-13 01:00:16,437] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 170 +20: [2023-05-13 01:00:16,437] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 160 +21: [2023-05-13 01:00:16,440] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 170 + 2: [2023-05-13 01:00:16,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt. + 2: [2023-05-13 01:00:16,447] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 20 + 2: [2023-05-13 01:00:16,451] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 20 + 8: [2023-05-13 01:00:16,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt. + 8: [2023-05-13 01:00:16,453] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 66 + 8: [2023-05-13 01:00:16,456] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 66 +13: [2023-05-13 01:00:16,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt. +13: [2023-05-13 01:00:16,458] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 107 +13: [2023-05-13 01:00:16,462] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 107 + 5: [2023-05-13 01:00:16,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt. + 5: [2023-05-13 01:00:16,464] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 45 + 5: [2023-05-13 01:00:16,468] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 45 +30: [2023-05-13 01:00:16,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt. +30: [2023-05-13 01:00:16,501] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 242 +30: [2023-05-13 01:00:16,504] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 242 + 9: [2023-05-13 01:00:16,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt. + 9: [2023-05-13 01:00:16,515] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 78 + 9: [2023-05-13 01:00:16,518] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 78 +12: [2023-05-13 01:00:16,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt. +12: [2023-05-13 01:00:16,589] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 100 +12: [2023-05-13 01:00:16,592] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 100 +23: [2023-05-13 01:00:16,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt. +23: [2023-05-13 01:00:16,605] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 187 +23: [2023-05-13 01:00:16,609] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 187 +14: [2023-05-13 01:00:16,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt. +14: [2023-05-13 01:00:16,696] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 116 +14: [2023-05-13 01:00:16,700] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 116 +15: [2023-05-13 01:00:16,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt. +15: [2023-05-13 01:00:16,738] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 122 +15: [2023-05-13 01:00:16,741] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 122 +20: [2023-05-13 01:00:16,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt. +20: [2023-05-13 01:00:16,747] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 167 +20: [2023-05-13 01:00:16,751] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 167 +13: [2023-05-13 01:00:16,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt. +13: [2023-05-13 01:00:16,761] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 108 +13: [2023-05-13 01:00:16,765] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 108 + 8: [2023-05-13 01:00:16,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt. + 8: [2023-05-13 01:00:16,817] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 68 + 8: [2023-05-13 01:00:16,822] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 68 +26: [2023-05-13 01:00:16,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt. +26: [2023-05-13 01:00:16,884] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 212 +26: [2023-05-13 01:00:16,888] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 212 + 9: [2023-05-13 01:00:17,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt. + 9: [2023-05-13 01:00:17,569] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 72 + 9: [2023-05-13 01:00:17,573] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 72 +29: [2023-05-13 01:00:17,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt. +29: [2023-05-13 01:00:17,575] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 232 +28: [2023-05-13 01:00:17,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt. +28: [2023-05-13 01:00:17,575] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 229 +29: [2023-05-13 01:00:17,578] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 232 +28: [2023-05-13 01:00:17,579] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 229 +12: [2023-05-13 01:00:17,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt. +12: [2023-05-13 01:00:17,704] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 99 +12: [2023-05-13 01:00:17,707] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 99 +21: [2023-05-13 01:00:17,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt. +21: [2023-05-13 01:00:17,793] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 174 +21: [2023-05-13 01:00:17,797] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 174 + 9: [2023-05-13 01:00:17,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3/global_step78678/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt. + 9: [2023-05-13 01:00:17,808] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 76 + 9: [2023-05-13 01:00:17,811] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 76 + 0: successfully loaded checkpoint from lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3 at iteration 0 +31: time (ms) | load-checkpoint: 15109.17 + 0: estimated model parameters: 1.905090048 + 0: estimated model parameters without embeddings: 1.78447104 + 0: [after model, optimizer, and learning rate scheduler are built] datetime: 2023-05-13 01:00:18 + 0: > building train, validation, and test datasets ... + 0: > datasets target sizes (minimum size): + 0: train: 1 + 0: validation: 51200 + 0: test: 51200 + 0: > building train, validation, and test datasets for GPT ... + 0: > building dataset index ... + 0: reading sizes... + 0: reading pointers... + 0: reading document index... + 0: creating numpy buffer of mmap... + 0: creating memory view of numpy buffer... + 0: > finished creating indexed dataset in 0.038029 seconds + 0: number of documents: 3133972 + 0: > dataset split: + 0: train: + 0: document indices in [0, 3133972) total of 3133972 documents + 0: > loading doc-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_1B5_text_document_train_indexmap_1ns_2048sl_1234s_doc_idx.npy + 0: > loading sample-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_1B5_text_document_train_indexmap_1ns_2048sl_1234s_sample_idx.npy + 0: > loading shuffle-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_1B5_text_document_train_indexmap_1ns_2048sl_1234s_shuffle_idx.npy + 0: loaded indexed file in 0.146 seconds + 0: total number of samples: 731002 + 0: total number of epochs: 1 + 0: > building dataset index ... + 0: reading sizes... + 0: reading pointers... + 0: reading document index... + 0: creating numpy buffer of mmap... + 0: creating memory view of numpy buffer... + 0: > finished creating indexed dataset in 0.085978 seconds + 0: number of documents: 364608 + 0: > dataset split: + 0: validation: + 0: document indices in [0, 364608) total of 364608 documents + 0: > loading doc-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_51200ns_2048sl_1234s_doc_idx.npy + 0: > loading sample-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_51200ns_2048sl_1234s_sample_idx.npy + 0: > loading shuffle-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_51200ns_2048sl_1234s_shuffle_idx.npy + 0: loaded indexed file in 0.106 seconds + 0: total number of samples: 84978 + 0: total number of epochs: 1 + 0: > finished creating GPT datasets ... + 0: [after dataloaders are built] datetime: 2023-05-13 01:00:40 + 0: done with setup ... + 0: training ... +31: time (ms) | model-and-optimizer-setup: 50381.12 | train/valid/test-data-iterators-setup: 21303.28 + 0: [after training is done] datetime: 2023-05-13 01:00:40 +31: ----------------------------------------------------------------------------------------------------------------- +31: validation loss at the end of training for val data | lm loss value: 2.692264E+00 | lm loss PPL: 1.476507E+01 | +31: ----------------------------------------------------------------------------------------------------------------- +END 3509629: Sat 13 May 2023 01:01:26 AM EEST diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb7883502eca235cdb3a3d5f09965ca7d64cd9d5 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c233e4594a2cbcac464e471eb8b7eb2bed0eb8d863e604124732116e164ac6c +size 89305623 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d54e835b3da9ce5ebc8229a080172ddcf19073ff --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41a07774bc6da46fb8ec94777cf31dad1d74ad4d51085ff77eb4c7898b6ad47b +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31dba7425fa84decafd0a4508efaa0f428afec8f --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f83ea48c4ee0e465d759d6af1fffcbabb911260dcba51bfd45325dca5d9f3fa +size 89305773 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aee8a57812a6c1621cac5e01c7d1a91710b0b986 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:199e504ce516e4cce9ea4877c57d45a3a8bd9f7cf9fd1cc0abe68b1dbfe08a63 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2f9a8adc6d15732c13d611f41be030b889d997e --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1040305f355f4edac081ea64a9cb9694bee75f5c664ce16e691859d5f331266 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67d37c5237a72c87bb2defaf2aff6ec859da4fd0 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7bab41abb44db96b6112774c46d3487127f4c7f87f56dab181d34a21abee8a2 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..393eefde720b696d15cf984e8ac4a77aa4f78870 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d827555d6a30166241f2c93c98eabd3541c0d936e07b20ef0b84c034c4961bf1 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce4ff1566378563bcbda6ada1f2d5eb7f49f7189 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff18d833dd189b3130ea5a8a0fdeb29e9dfa69c18083f7045bfaad3ac8fea974 +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aae52d8c2117e28256bcd5aa4504ac15f7081df1 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7e30331e8e6c3d04227d57771cf85304198fd72b3ac64ddbfbdb7d5ab54943a +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c26e93d11a838d477f515b4c8d57310faa8bca1d --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6570f496cae4bded18a86b4d12615dacd61408317ee04ba9414f5101b6fb33dd +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ba72ee99bd02ddda44755cd16d95eeeab4159bd --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94b206af23dbb5f63777146020a08466ca0c625b5093420b9c543e6a50e80b6a +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a0433fade31908671676e4e846c70d33ea954f1 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbf9cd6adabba324a34e3c25fa5e7a000dd4a437382f088eee9108091ffeefa2 +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2749f1786bbaccc6db0a0aa3de2f2ac1cc75469 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11931536875208c6b801d167ef02fd6581f9f90d4f8b34435b90b4dd9ae5e149 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49141ee65a343c511d2415272718ded6f9a7db6b --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b14925da0b5c2fe8d6bf8befba8f83c19470e1d60707c016ec9a752bbc0a63ad +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cce2c7f73047439f3150b51c6229f446115ca82a --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e700972369a9acb7a771fb7953d08c89465f10d9707405754a7d263c8b9e3773 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6cd608949c147f6ee640ca7b7f1f84fe8d002fb --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:163eaa2f238b1ff8cfd19a02e1bdbe48383c7dd785d7a947a760578abc063182 +size 89305773 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..089dbfe0a8d00eb98bffa96c3e521233cfddc139 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eff1ec6d7ebb87bfe6386da211a7cfad68e72270263793a9045af8c71bac66a +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f603bf24dd9b1222332520ee530de4a6102541a6 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:515be5bc9a53850f99b2c5d837ef34b200206b87c681164f857e89549757ac2e +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9bf4c91b22028357cec4e016c83e22e0f39f773 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5c040b3f21dceaf58dd84a2c5a7e402125953e1da4d02b35d90d362c3af9784 +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..751fedceab290abd7ed7f8f0c586789a6c92edb4 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad2066ca41e6a2a8c3f536afab6beb34e7bc73fa7fb550e72e75a741ce6cd8d9 +size 89305773 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69d5286321a3e97cb21a22324c8b1188d32e14ea --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9e41efdeec2fa5b708bbc6fad4cfdd6c0b9240053ccfe8fd8c10dac4f5be8ed +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2582f9adc0a01aa5104cf69a689e3684d628e1a --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86c3c0e12f337eb3b550eb3af930f6a63ea923f726e58c6795c21e1195ff985d +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55d9d6d2497c9cce9f308f53f9012bb580fc132a --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c088234d3956117f971b61fdea2427843e92bcd5ee1e1d45679da097c82f275 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d01da529154d83ee9a915d9ffb3677c3553cad3 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2c39a3e458c23aecd63b7e3aa2afa0ee649bcbee17c2759ffe4ebcb34f7abf6 +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e4b46c2753dc4d00af609166194f1cce4094c80 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b6164cb3ac7cb71e611b2471ce6e5f99128a69ac43d74adb12094f7f8219e1f +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41b3f9f2330a9104337cd4a450fad21e4c134fac --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c313b12fefcaaba5196d231daeeb1810ddf1747c8dc3aa61dc7c1bd893cbb7d1 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c09dc46ff51795847cb0965a8a175380597350f0 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16f7bebe92295a2b29e4a6810c328a312975a46696b4e906d39ef8dbafe7514c +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e673bb75aefe2fcdce43e00b903d09e9678a4713 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44a67e6d53d4f1cdd0f6777f209605ebdbbbd04847f21a12cf049cc05809082a +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da93fd08e7c8172b13eee19b383bc14e83a5193d --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d532cf1fb931816a16ceb4bdf14c6bc4b9045fa1e6e4dbd0334c23a8d707ca9f +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a0702cdd7c8cb71ced3a6dbac1f47563c0a576f --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b964809ffcb296688ba144d5b83f08803e94e9163280f92e296802e35951653 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c4e884dcd2c96e3525823ee07e80eadc7e8a8a3 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c135909113ad6b136817548c504223a30b31776960746e002dbd47dc12cd6e77 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3e67440a109d4f15880ed045e2eb3f88be0343a --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f074f3444bf41dd359102c1bfeec719f4e1a2875f904a1b2491d6b2abbc00ae +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f59c96ee7470844e8d3774ec204c6fc33ef12157 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fe0df73e51f9f820d7b2c0dc4f377e6a38ce5c3da753ea0a808a9733034f494 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59d5700ad77df24a1dc2a2e0229430838a4d2b70 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bfae5a179b780ecc56b8e17f1695e5cba9a8dcea8eda357de4b5199027ee68f +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40bff9c21a263fccd251b702669cad284b15822e --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cb6c9dcc7debd93010e482f47334eb4c8d6b0a3d048e902edd4f8cee0639d0f +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..070295723c8a3a1dcb575e7abda650746a602c8f --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78500ba3c3f43040d06cb5e5d021328c70353f42ae3f923ac1c549d139bd6087 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f44a023331dacd9e3a25abafac4bfb5dc2953a1 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ad644446c000a95a4811c97c6e621b22a4b9fce6b87bc489ef408908446af21 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a86dfc502ec371b0e7bac894e2cd0f4aac1897d1 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cff855ee884f204039e848ece50028feee2bb0cb84df0680855007c7c882aef +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a1dadb7f7be897d13e33ed529cff98c4ea32710 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb798d42e9c2be3a0e60f2ba15723cfd99197894e74418d9f1d89855b24119c7 +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c27b1d56d702f2fbfe74131a9238391a3dea1f3 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7055063c0b63e319c4f7d93684cd935145cf5a1ff6263b62d36dace0e8bc572 +size 89305773 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30c5ad7d42d91354ced2a2fad5324fda8c2959d5 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22d85edc6b228892a933fa7408026680ace6c3b6809939d6853f87c57f9b543d +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e768a0ed856d9958a89a57528905431288968ce --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cfe7df6ebcf8b1fe15117ad39e691b9833b139b19eeee8717d93faa95602f98 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cb6f045d2d0784b3e8b63db163f3ed7f910df19 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1347e8d49e4652554766dd2b0b278a765f74c6cfe84981e463972bd0aa28283a +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8435f070324923e5de445fb2ab0326d8610e1bf7 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:553e44f9b06f0ef3648b94adf6f8e72e3e388d062d9684a646a4d20b264c6c65 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4271fa062372c73cd554ea1e46c06fa2aa29e9f --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acbb2254dfc1c71be30f95750ddfa121edc8a38a15a60d03e75257162325a1b4 +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95759d890fe51b8056c17f4570ad51424d8057b3 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af44140977ae11baf52eb729cd8ef4470ae016512d5336fd9b7352879b9bbf8f +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7d2ba40272e083db7a29b081f154e4b9f672bbb --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:387bfe53938eba0eb26d355eaf35c46834beece162faba12d603369c6e8161d6 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78c6f856c03d2cec018e0fca6238deb235d8e5df --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10d10de874b2c8c359d1e11c77a3cf14c4afadf7960f390af9891c44370b1814 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..922a5ea2693bd93a7bd430c6064a5d46bed0d0b3 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea17a76d2218105fc35876364c3e2b4c94361119bd37a1e113d58de6786ab1a1 +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0b70ec1eb11dd178a32f41293e1746588be546a --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7326b5d509e40107189c80bb92c8699515bb689e80c3b439f7d3a861390acfb6 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dec1a473937b7ceacc258e4c0bd21338025b3e10 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3383f4e29c3a70fce5780ee78ddedf67633303d9eebd6b7c346aef1df1d40fee +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8506198d8f01a58e1a621456cead64b8b3365b6 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e1dab395ee568f757d4790d372e847cb24a71d7be8513b85699fed0c8b9aa91 +size 89305773 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36ba2ece8b143ceb1c09b7681e3f2057d7f6281f --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c35127ca4893e1844d2fd98b72860550c70877803c047d8123c2f32decfa8571 +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a63cee67e50b127002cda8ceabf75c5f0475945 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bff8cc9e48f2377a10be814268a3ef2cd2e3fdfe44b79e5f7944f50ed771f79 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47183d6f705b3a02e1d261d0beb3d8f8b7ad9f7f --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d855b2c42597aaeb33e105fc8412ede47b92d9a5779589c03ea80cc6d71b2b1 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b9d23bfaac44597785bb0cb9d856b37345ba7d3 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:590ccddd9bdf499702f1050721062c89ff6bb5dd08868c635a93c8bb47956d0e +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..767a5bf3686e8cb2ed05d45f79bac7eb626cf109 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcf61a44af7684e70a61744e8deadf815633ba414d15dda90967efd8f6f72af7 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fe411782a39b922af5cdc8a81b94fe86295823f --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11d2394f704d3a1e762d7e8ef11aa91285e2acc69b7755076b7e669b31dd65b0 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ec026b4dae64bc18d3df06c837acc4c25dd4630 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f49f168616a1b6a9002d366681deb17f38463f047df314c9c279e836bb59b21 +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..def689ea5df3ba9522e85a758eed36aab0990bf4 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:839222cf8fce34104ff05096653ae60d92b148489c1ea0c48054588467af5305 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f072a5e4fac3c64043e025999b1c4340c326fb22 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ca92da0c29f2331f5b71c39b92b942f1645343c2b326a8dfa4136bf67d8e4e5 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ce13f7e2f70143df9ab27a7564e217e95471a79 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e67f60dc8c793a8a1964b85f43cdd6387fbfc973925bb8f0421bf7f6db4f11a6 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f51132943b5aba9ef4ba049a4902c55bcbdfb4d9 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff23ff5ff0a9b595455bc331019d39fc4cc6964e12eda6cad1ea15f836eadecb +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a50c7a070a3d34475ecca70e3cbf65c99398f0c2 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:075d9930dce716b7a98d1f0dc5e65e79d30d90370338c544a6c97f0f58dc1ba9 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41c52d414eb7015a9ea021cc7e1d74a5dd44da6f --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9486a1773eaf0bad6c07f5758ddd4e11495c23527a7fb4d2669b15a2494f8edf +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4013ac82c4482c9869d967c4cb89c561902eb388 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:099cac790aa184b4e637b9dc5a0089b67235bfda2247b4b523fad6e979e0bb17 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81ceee04a0b69ea76b0447d55a486cd62ab246ad --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89491fa2572803795f71fdb312acc639d2ccffa31d9a962563ca4119c31ceea9 +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a2f06f8809dd8143db0e53d564727bff22ffeff --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b21c856d3236e937be5361f081b2a2b0e97378e542999b6b9bb94cba8c27fc9e +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7330281e2e4bb852a1338516210a91b064a72658 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff65ec55dd0c77a375304fea679c7db7a608e3bb74b038734066e2e674580948 +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8570eb39c231e72039b46df2cca2094f00c96ce --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:401acccf5577672f3335e04743a97f81afd7591f9bb40b30fd66d81d1b0cee5c +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48f786c820b97bebf3026be6c53f4df2fecde79d --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7fe0c55b28d5a08a8372e103a81283ccf701ff9cc94abe7ec1be44fd1768eb9 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aeae100a6eceb3384c831c7ec35868f11e522bd4 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:164a5a73a4af635468b57d7d5d5b097f0598a06869711db12f44a2eff918adb2 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85dc6605f86b4e3207ba7b53b9af400d01e241a4 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75324f160b1ca5ef442f1a0dd5f4316fd1355376bc26d16519d962dcd98bf9db +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c86160d6028b44998b5b3295374862ebc6d3df4 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b5b26627831b7638d78447cea9c52487f85a0e4e70a925df54e6940dfd6b041 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdb8e1e5f6af3a08e2cd267ae4543de63d099acf --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78eeec8583e4b44db5985c8ab93987150385dbd6e903d21df64554c34400b56f +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ef86170eb5ed368f57d788d8a54513646950319 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a18a1136215b4ded6657dc2c9d5c97749ec558322021182a6634720340bb2a3e +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12db99dad2eb0c9afa0a7d8b92776761b5022caf --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f4df2cc23b86ee9e8877200e8729c31257bbc606024bab4c9d69057fd85a498 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ab272c8dda7ef6a02ae540a0bc64c00ca34fe77 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daca3c512c8d0bedfe5b2436cfd421cb57ace2a6ed0d2e75cab35e2e02f8667b +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..383a4bdfd9e584f04e25c0715e869829b3d55e7e --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f97990ae32952415402bc6c07a59d9676eeac74285a25fed87e7689553e3ac0 +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b4c89f2fe154769ee60244101c918384ff8f329 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4b6eda475f1f5abf03d4b364ca61daac07671209496f9367e60a397d82d46ce +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c6d320d4a6c45659d014e62b3d7554ed156e974 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a403162a3e58698a77a54659e7a2fc2b06a28dd4076238341684849b8a4e6042 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09ffbd12bc33a7565387b5c8026bac79100c35df --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:937c9e9c979c7225454463c4be1a6856ed3272c675b38651624c394ab6f49942 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f4ab41e1cd45a1438ab27cece219ccf2bc504f0 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bab4056c4e9e85fbfd7c645d1fe30999a23e7bfe98e9351718ef355aac51e58 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5afcb09d20f9101ce990664a2e68e444ef1d6957 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc43a9935348960280be77ecfdd8910926a874bbe786e60c447e197e17841d31 +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b8c4d4dbb8761249ac30eb1a3bd9870d4a3428a --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ee71b7726a6918cbb5668e211f87181269173fbe1fc19df661b000cb6a45522 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9996e4b9ae914a9d04e5b86f542722034bef068 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e892668a6dc725724da57585b04a0dcffc0ac53f57f46226757ea048bd3acc1 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f576529f73353194415635bf63c74dd5df308173 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f5910cd1155c9effb887b1b6680c9e7d536e0230f2597ced2002147293ab784 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ee54d10e5e5453661a239e11c9b6e14031fbb7f --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd2fdc1a34528b45b742fe8302091f0056859224b0f88fbc71ae2a0fd9f9e5f4 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..382e8619d6eacbcfff7d33b8501213f5b1ea6059 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b4c1516ac149f37b81246539a7df1d93a1136c6759a5a00017a22f25a49efdb +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e79312803f4131919b6594e1b5a85ae0b42c27de --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38f849524e300b7287a3339ef3d6f067882213cccf654e59a08b9661d216db33 +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6277d2efaa7b75fd12c8aa4653ac39d7ae18ffca --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1cff98c83fd2c792f7fbe4470458a5e8f2eea4826ab3577971ea553692208e0 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72565321ada40a96b0b2947fb288820130e3444f --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:527bb1bded938842eabcf2e198019f4f6e8e16363e82d8dcf02928273af87e7f +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11d552e7e35aba7b67c178e0d342938d8996482c --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f95cfaae58a262f76e84c29cdd0b40d587aa19d56da3210e2a42ac00fa96520 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0aa93294d38f98368b90f61231612f3a7dac9ff --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54386fbc821fb45fd4e39c62e57aeff84b00e5ce2c8ec2fb28a280e41507e273 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5d978f4c6f1d8ba1ba4dc96041f2441ec34759d --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed2aeb1fc9512f8b6a760ed9a5bc7247e625a2aff7ab6c22e904c8ea71ab8baf +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28bd03d13e21f5f061c7692a2e16bbe58a4846e9 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dce715675a1b5e9f18bcb8da89aa86653a672504b21f3f592ea9c04616ed2453 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70cd4e1dbf9c5c27a86818e68577cc9acd6bbd3d --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:212b11d30f4b4fe1721e33c77578af5ad65367959c0be7fcd5cc1529d78d9139 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b7466c3b020c0f42646e43eb3a3c68d2d2640a8 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc9990ecdca58a61bbd51bc4db3200483e9c175cc87161cd11377086159dc3b1 +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c63bc70c0977661e96b47d0d03ff68d2cc88547a --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9c0c326ccaaba125c4e8a2cb6b5eb7213bead88bf1f00f782f236d7f3dfd216 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34ad1b6d60caf04f5b1d005b8695e9b44dd8ff2c --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aece9ccaf351618bb90c0ff231790c8d85544f65b3f7074c456c7fe5e083ade5 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d56690d8c50608db8ee914b6c312038c24ed3303 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fc28ad085b7f5ab60a1010843f732f33fbd4909cae9a257c1d166822ce4593b +size 89305773 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42a5511bbf1f24ba5c3614ac7ac60ed3c4941e83 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6753058b17f23c330b06934de390df4270395c3ad998fd06aac0b1b64ed628c3 +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cbab1a0732bd96a6e206f3f45898cfd36045f2b --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f4a9048441edbba0659a6ded2acda48788be9ebe9b5283a00d7875fa8c97b02 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64c38b18816be972cccd9f526b200592674f7362 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60ef60337c38ad676ac9f4ac060055f5c707e30a5a6108c9a27a42c1538f623c +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9969c5ac5c49bd4c5edaa7c085f5e9d4e50fcb13 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a680bb3281d0222afc609de6ba8588519da52f10b9c87dd0abc856cfde5a2532 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6a6caa2f69279ce5a6979ad6d595875cfc0a6ee --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:789245221ef6f3e3d97f346a315f7fd8bab3f3629d3485e8fe06040225545f77 +size 89305773 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f4ae544f2f094f1da86e6ae5bb4fc55c9403f80 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d891042ae314c131d3401799c5f7bad4ba597257870c5a23c1d4ebe4451ee724 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..998302964571fa433682fa0be0cc7332d6a6b4c1 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fffe4aae0fdd000497cd7c73d66cf35a3803cac10787cc4a0f1de4dce6ccb473 +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0669cdf8bc5d3e20cffb666df0e64ded88b28e45 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d74af726b88862d79e4da0bf38071fe4534f2947b50c71b3ff85d5d8109fbc40 +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9ebe3cba12c786293e1f11182d4217b675fca27 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:061f691e298fe89fa990f5f72f47e8029ef4177e070e4d0834b6eb920e49a370 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21102a6f2e1245eeef468f26f2fc2a2c4c5556db --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d22395b3afc1b69eabe10825170a740c7149525aad358daf3f8fd3a4acf91087 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebece946c6aa281cfd779a9ac435a3430faa098d --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d91b1f0e4cc30bfb8f4b1d5b21f7bfcb642815d6ba4a763046320160049dee01 +size 89305623 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00f3fad485fcd3bbc7856e4fcf199fc4ce12064c --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9e8ff8daf208609622fd0d5b0e563f8804fd6df76513dfaaddc305f357cc14e +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b07ad1cc0d940e716c44f110a0f62fbb8aa9684 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb2ad73780432ada30edde8e6830532afbc465b6da8d9ad52d65c986837a68c8 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e30cec26ecdf194feb9d9b0da04e8661ee15e6c7 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbe954dab87e3f18595e0ad4b8da18d66e0cc7fc996858a6c714d9dfcaec08fe +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4324b530b18266795c2cdce12f9641793f6dad8d --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:550052068d6e0ecceb28474b89f81cb9b5f0606310a6c4e2f3ec938e0c372f3d +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d810239fc05d9c78aa2c61c01a4bc2d49034503 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebbf7021c965e1670ec81ad37f9a763a300e56cec2bd28328c6bceb6a499eb86 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eaa57bdfc42b37a90239bdbdc77018e6c2a24bb6 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4904f7df88720ea941fd5610d9ad1fcf40b4ae00efe5499685ee0eb79bb57c57 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ab0b8895056f895d703bf905b73478d98ca3de --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4a056190f8244ec01528e94e65f1af91ce10dc320ed7326cd42805d8abd2b07 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a8587a4aa0b9e36a8d897a8f9fdd779e522e22e --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efebe62cfdbce515b6082fbc382dc4174a8c4fb653c3d12d8f6c92858353537c +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ccd7303ce88fae696824d2f3c6466d2117c64a2 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a47e794b4f13cf8b85952e0f36d381c281c31a9d05bad7b4db1c3fc946b1f23f +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e35f397ce0a82dc0e359de950bcc43bfa56ab9e --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71881588017d35b571b7102f21bb8abaf627d3c2e01f22b2b03349ae9f4de3a7 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf846f73261570716f463894d3102b9e08d311d7 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3044758bcce827f433b1a7cc37e393a2cbc683450f41271714bca68e119e0fcc +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79de10e0aef01fe313efad7c399a66f7ac5dbed8 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a56b4534a8a96c73bac131d6952ebf0a29c091df10787726af6fc335e7e59de +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70d73df4a84af4922ae1bb4cf31ddd592ff16646 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e17ca1e0b728f0661b7d99fe14a79017825b847a3e33035ecd00c6d415b5a88c +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a77a460699309f7e7ebde8bd00a871b0309e905 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d4fd6e39f5cfd2e74b90ecdaa9a56621ffae952f24e7461ab86a415f1dd8132 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..527f36ffabee5d8c68a5d2f7365a072b3c0cfce0 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d195588023e0f70b0af846065a4ef022368a7fdaac2a80f03a323ed16c7440e +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bddfbc394eca770f77a484e8baabe29bbeb6d54 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd0e62a9bc79cf24098f5327509cd51e72493c1c3fba161358378e6c0a4b5c3c +size 89305773 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..933e47656803c13077794c434959995b6004470d --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:871ef5b0b3a39a9c4b5334f4175c0b3196019cb440c0d5cfe3c70f41e344bde9 +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec87f9697bcdd27d6943769771aa89d1e205192a --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:336f2de63549718b4ab08b97547843107dec0f4207e2caf0afa5b00e16ab8c4c +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de654f716a1ec91e662a6c5df283ca6375200958 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81ac58370e4eef9f27c5f2fa5ea9bf9ca043351fc278c512d5aa5e72f47258a4 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69dbe3b36734d86a4a65417fd408acbca4e5c005 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac62cd8779f1f74ee3c37c02ea59ad90e1bee58a83d7d5a811529701395b6f45 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88e121bbd012495d506304f346aa97d7535da076 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e169f4c94e7134b5d18fc6f01694a488632952eea7f66990fd1f67f3eb1ff420 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c3d0181de7732512676233b0604e0cb379c5ff1 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:054d6b78bfdd595b2448f65354bfe9ea2a39f059feb26cdd5707e63d8e42445a +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83149f24300c87f8fa9b11e651980a52848c0f48 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68d8881d2f69ab402964cfc6cf3b9a8b2ccf02a0c64a8f5c7b4a85e68296bd98 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb11dfedacbe8cb8214ba77ce72297d3eccf3760 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e920f6a7ac45716b2833a3599efdea421aac64c57448040225d21f0301075b9 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02464a0820a7b4830090d6af1dccba90cdff42b9 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6db40ef750e00907c1d64835f7ed93a89c61b0ad5554428da1f5ee5a0caade9 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa4aa7c0092361d05f44d3c83ca2b6e014452a27 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b8c2af22f0968e8301e3dc93d1a61800055a86384c746421ba53abc490028ab +size 89305773 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bc4be7035d0a72071024196b4ff6819afd22193 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ee20b5f257a7a07f09e581244c03b00af5dae8ed0639ed37cbbc221b2c2fd8b +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..837d3fdf8924bd21ca147288197d8181f8a726ac --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09248bac1527ca8095bc5194c42135806428fb8bb5154fed17104299e495aa8e +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cd45f292c881aab627dfff119384b3f5abc1753 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f03482862ec65b176b519cdae83ede9d378c3da3c92a46770a672f842f7a32f5 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3208286b0f921f02c074eda0c0405ee52e981b37 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a0c1a819d59869cdad606892c4ab45320297dae7672bf8d14f9713a0c13d9ff +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed67e4ea32aa4dab87c4ae972a793a4a54ccb9da --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e635ad162d48d5a09f996a97438d27097641e28d5e0261d7000792255f83679 +size 89305773 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eda691394337ac1436bc59502b1bac66f609a060 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc2201d6f37f0bda4920016595c53993f4f68aa48858b7f8488bc4c38aaa587c +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fc30c7d44d6017ff84c50bb5a52c74e94f6f5e7 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f78fe104f0511f7db1d58cda9b19bcbdde41fb6b554329fe869cb72ea00e35e3 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..852d0851adfe5156c123e431b28c52940f7927e9 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b49b78995cbc68fd61b3441cba4d26dc33204f536887f06e22cf26461227cc7b +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0b44084b05cbc8c48de231f8be6f23ed5a0fee8 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e1a030d4a6f7ed9a16c426d9c49e6a2130b68645118fd392794bd24969da200 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37a539c3f458da0529b3b3a11767b74d3fe106d3 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dffd163775e6157a2a66de32b6ba6eb22aff5760d62ac53daec78ac6bcb11fda +size 89305837 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba133facf4ebab9309e37d87d3b8d43e6d1346fb --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ceaaafa876cca830f84cca5cef4aa28f31d4768dd19f165bea581a24884e2ac +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a9766799ae5ed28af7da181fede7e996c43d9b2 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a9d20c7a4ca7948abbe7832430bf81143961f18f4546f8f17247da4e1f5593b +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba20a1d21e3fec55f175af677cfd670b193c30fd --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f08b4d614f457e4fde73ada6db9d0623590592ac1133f3c704f7b6d6c9767c92 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a90d38ebe203ff0db411b5a31e2bb8b7b208746 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8041ff3018d6f0975e99b28c86c05cee85a0c6b09d89f8b2f3ad1ae60f191a8 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82b653dad330aa3ed8992908cce86778a0c4ff16 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b6ab19c8af5b69536d6de9ab975fcf6ff4fdcdd6d4e46536abd457fe6ff7d36 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26c7786c6e0834297d94bb0a69db2039373a8fcf --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef15b09fb37dc8f2770041d3c31e93e624f593eb780eeeae846846176538c3ee +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..387c26e692d09d47c068f25838ac1c3fca9e64f8 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7be927fb9f6fc7b093e25fd281da85e4519f71e13dd820cabaad78a07d84c421 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..119e87492b648bee3141a19a9e2344fff8cfba4a --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3aa4965d9dda0ff5f11475904ff024136dc89aa22b69a3cf63e822550bcac9e +size 89305762 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9da9606c7879a27f496ddf84a0046dc844e0603 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50c2c36ebc03c7cc701fef504797553186fa3bec31bb62352b6c42c1b6224031 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5568bdc0e22aa0543fc33b3c6a30c974359ad80 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e783b644629009a3916db2a51a19b0876e564d349d0a86ed0538edb620f6bfb7 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f94d28bb957ded4ee05c10fe4b19ed44247dca61 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46700029d23a25d87a36e3dc0b5e969d16cbd0d8c5d62d3f723c26202e6d6edb +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3aaa54ef7923498edf92c33aaebf8ca769c8f55 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e305e7212aae98277ce14f064d74f75a36e4af3164519c7cf19c0032eac3028e +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4718035e42f10cc13a43f3d887e986b64c5f49c --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3511891501e33bc9a7c6ec410fb85718a8c54d1bdf5ac2e5b75ecdcf3617034f +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a319760d6f88d0ccb8761a1758ada6e51e0c6884 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac5e9bc235746c7095f3b178722b34620fcbad572ab4875aedf8a4e3bfc0f93f +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a36afb73bd008116409fb0e3cc4ed90bf4f8755 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4501a19fbce9c8ab1c8d5e55e8c5208a1fd7f89e3564a5c277191b03179a3c1 +size 89305709 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de4e7fc420d19ec6887d31583b5d0b22353c5e55 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b733995538a6de539c18495316380763dc117f1254de11a11dac1df7b939e5a +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b527320d536621425c20de1adf1acf3231b409f4 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:107384988fe5fec71e5d57c10d535c6728130bb725096811a1d1754372172434 +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01a5794fb975e18222bbb504b8aa9d1789fa7abc --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bb429e6f4c2b90418c47e0e1f31b8f8b9cc92d8a48211dc81eac5ae3aac67e8 +size 89305773 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a136b5cc758666092e891257735d24e1f9c19279 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ec74e6352f20fd1c926e450836763cb15626ccc3d9bd978965e54cf7c3c4dcc +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c699531eb1d71ae30aead965bb980a856a7dfba9 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85296c7d3c031bccdf860272a15a715226c78b15527da5ae92d9f1cf3cb0b7a8 +size 89305773 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed5b800381cd51227d9bacd61d0b389ab6caf7df --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ade004572ae8d9d4967f36d333e1fe13d2179dd9f05d0afb0f22aad687651f25 +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77b7252b03d05cf4ef3819cd9ad8a8259cbc9f4c --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5d37fa4d303361293b95c57f5601e0c7bf1b29f8c63886d2842dcb218d3e7b4 +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de2de50ba3a818f8097e2a4f2dab25ec18509768 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef2c3bf93227104d17efec52825d0cfddf7b1451d563d26d0c5a7beff62e6bcd +size 89305645 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a5f64244a1bb9386d13f2297ab1c60db87622df --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:106fb9ca5740b8bef3651192352d35833b8c5a07705d0063139b0730da219abe +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71e3c1ca9f783e0394f53c670232bdee4f879ef6 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e4646092667d69022d5956b6f0310524fcf412dea916229688c562cc3b56109 +size 89305581 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f001fd3bb60ae4cf32258666d46b394bffa941e5 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c59d36964ead497bd15d7736ad912af31b86b476ff2e35d475ed6a85b202116 +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00025abc9336ac5f9c8f82605df4ba0b23decda9 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fcefeacf06a104758d65b32d526c3bb0d0e10ed6e4c8ba167a76e7d6bdb04f3 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4f0c03973d166d1e02e3c06a2a49acfd3e5528a --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27242990db7e60ffbd9a38c49c38e42c0fb1565a4e6b48ca7b0cb1f87f450559 +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb06cd0f1099b4ba9ecda5a25c6cc9fd1214666e --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1be2afc136dfcac921bae7beb26b2e3bbe834ee0869ad9fda3aed3698de58c8 +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1269ba23f75fc3d6efd775a77db92d3fe1bf6c53 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caf502cfcf5b94c39dbd6d533718df72ce8912a47a1a03b9fc883f9debb128ee +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2f508e0aa34792610dc52e3a9dd2a684090384e --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a062dfe59d9e32d2c5323cdaa3d771498d8311e88e3bd5141cb65973d2c508f +size 89305559 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99578163ff9c094da1c1f750aa7900d521325c9b --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3b6645f06269489a34d7d4ed5dd68755847680fae5f1eeb80b7b338a19f4217 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aa718f59b1eada499e50d110fa979941ffa97b3 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:830c91bd3d7092765726dc2cd2d1a31af1360887b806f5a4f763d3a32e18a560 +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f88459a2b6abe5e6b0874ae55e413d2051ad7f3e --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67d34885d0c135ceb107768581197ea8f630327a5d13ed324f6eab13cef29df7 +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2b3b8e76ccd9bb5a583a059efac2775a5cdb2b2 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29ffa4e977a811b056868cc1b51fc6d5c9c7a00ac6f340e6a604b234e8202d65 +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05ebc30a6393c545c82cea638ea271c0208ab992 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37c79f734f0c4c09a431afa1bd813fb63f0557159cb9b62f76d3e3c36d79afe5 +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c722d35e85b70e3f590be020aad8a3102ebbad93 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2e6328d512c0f0b6c9f9af65ba18d403dfa83973f490adffbd437517cb19012 +size 89305762 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6535ae392c127d43130a3b90bca3353ac5325dbd --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7439e7d1f2595a39bdb5d4fb4ae6a4e0aebc170ab7e4386df4fd9337b34d5be2 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7a49eadab99fb46886ca9ab4d99fe723dee87a4 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ba0cf3c03b5bec3b1c450c77c7450de73de67449143a849d2f109fdca96715c +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e62f13977ea78102567a379c3f804ecee7f02e72 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:357a2f4ef8b1fb6c2d34968b2de8433571dc676198e858e213035bd67d88c7d3 +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..52415e34c7632e444dbcc8e612757edb4ac5db4b --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e91beddb4d5df6d9359e41a0d3356706d1dbdc0fbb18ccc9b87dd46f53289163 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a620c2b4e2a34c893cf67744e2e72fed64327dfa --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de77f3be86d2f836df043be7aa949d834eb2c5504d895f4be4d7405a324a54c0 +size 89305623 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3bc12d3388700226529ece92c3385ab88f5b1d0 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:241a02c10dcb91f138e5401d0b65228bf8f635631bb746b7f78cb3494b5a99f2 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e4b40328adfb15dd7942bd8c99d441b0f81cd57 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63aa4d7eaeffab145378f18125b3bcb12ba983f0e694722db3f96f1b0c805725 +size 89305762 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a8612231118797d6a615c66511cc26784da6848 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5a26fc75e0a2655e80a149e33f783e90edb6b9e7914fcb069adcf2de70de277 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c476968036f00f2d1808737ba16283ecb5c4f69 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d147cf578464e1e4da40bfa15879e6f8d88d1b080bdb16a924edc2e6d280537 +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d2630f3229bb8f7a88104e703952e81a05b60e0 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7636c32f525b8168bbe0f43414bdeb20030775adecc80083b4584ca1b6c317d +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a646e66719109ecc0e8a6746d96d72f261be0228 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c18e390c537751ee7a1e35f013153f36a9686edc90f89f7a78abfe8d58ee906a +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7dc47bcaa17dd3bd36e8541765a1bcc070c6be1 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1c031bffcb2adc5dbe9bb196f6c466037b771e8722bb35a66c72c8313e9cece +size 89305762 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7952eb8974aa792a1e192bab486a35feb77d4fc --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a764b1e4cd82f77719e3bfabb0821ab97d208ba92e0456314bd368f54d969e1 +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9ca9973f332a8531cbc69eacfd75ed438dfe206 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d808528567f5eacc3535b2def099c9cf7efa2357ff2f302331a96ab5cb32aa8f +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbeca4c0b30e6211e5c9c3758aa216ce8e9b2a2f --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:300f0034cdfc712a0a1873018ef8d17379033279379bb022abadb66d3ac36eb8 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa5b6957ff110728e90c73b8689d529c16d0750c --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5552c9c1a11234494f981ed8d6bf7cda1f45dbb6c918514a599d0d325345816 +size 89305687 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9d6d07020bcd2e087b9d6eac46a1fcd313f7c33 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1040f8a76d6609cad0d702b50dde5906ac9efe7c07b8b2ae28688a50e221bdd5 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e324c014127bef86cda10b577f87be82a681e61 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5ff71a36f2f06e1f3479855e2bc37c8ee78634573605bb00620f317452cf4d4 +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..147363ea5c8551c5a4010b94ac4eabea9dbca20d --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edcc933825938cc7f072e551ed964dd0af471ebb0d1c0d753f75a5e5d0d3e241 +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d20076231aeb17ca68ec7b43ffe6b6b8a7415e7 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc35e29eb5a6b38e6609040b472ea5c592eb6ae01f0209b77755a1e538172db6 +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb0f896457f3c757379170d94f9d01ffe0fd164f --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec8963d4d707644e168b6ec6e01f168b06e5947e7f8f7e350b8d53551a876720 +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15f643d98105a189c564ca8f9baadf540821de12 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:164dff2aad59ebfba27dad8b3e6029c2c456f17c72d1e78f209089fd360b7e39 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..512a6ce1bbbfcd0664100903831ecd39a816e146 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c45d5ad35dd23ae180768165a9fd7e59a81bc1cb3b08ff9a1782802e64be4cf +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c911717356df9be7d5955f2a83b74e69de886c86 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a91c9fa90a4e328dc0c8757d3781737c4e0b85478497e3bdaf42c1c034b7ca4 +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c456250eeadfd12fd3074246b21afdf9824ba28 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7346c1ed9213911c247f93e3c6c09c022c77c5419989f3fa609861d5c357effb +size 89305762 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a4497d31995b4ab404a262de145b4e5fda75e7e --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd9c22e2bbedc884c18aecd40212639daeddb85e205cebdacab30e076bfc9558 +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33f2cce46df974da83ec90cb8daeaa3cf728d823 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30a1ab5329346443c94caf028f252ce46ebf55fb7ca0ecbf76f534145a773d04 +size 89305687 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d00e2046a7f8b3451678d892ce352231276d47ad --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fda6a5f711fe85bda3b3af0faf90a9149f54214d2037a794d3bf753dccd66d8 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..def8be39a486091f40fdb6bd522795f5be45b63b --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1bb46cfeaf5de76589c06e5dbcfd78c51fdd67608c56b83a5112d274052193f +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aaf0ede7f0876ee336beaa751c7cfa516003cb9c --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f13bd1b6c8e0039c8dab3042004041a8064701fd70cc7849380394c6fe21ecd0 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f715d17d782dcb569b69916b1af236691115e7e6 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfcb9547368243063b89970d84116e85f9b0a988b2d6a7cbcbeff6a1ffa47bd1 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62a626edcf39eb92f2b56f771c718895a5a2892c --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a820c65ca34f2a22d9053e5b39f23bd78ef3e131943bfb2faa380453b5300e72 +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea562fd75500c9ebf4e247dd48ff7e668f4b2b24 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8985e3905c5835499003bcb9d0923b60ca5afe07be1b413875eabfaf5e2792d +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c28074b7ee567fcd4b3c6370f313d2789aeb9942 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:734c4ae59ce1825ca14f05f20cbb418be2ef042cc5389477b2b2baf99839a208 +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9b134a0358112e9cbe8216c77870802db932a0a --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cdaad22d42f67a382528da848ec37dc40ee0d339211ef6e7a6d5807a5c1bc35 +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9f533c4daf6f2ee90630a8ccd919babf04afc8e --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3f2a4dd3671429c95d49d6723ff77224b73f58c0555820b4c043cc569964c9b +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8277adce91fd51f2a16d3bef32a8d538d6883b25 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75c8e7d96d5e05b75ab74439d4543ed03701edd80c18166204ebe6019c8d6f35 +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed54024a08c68a66fc179f45b67c25409a04cf40 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64728e621cdbb0b8b0e084622a6cc2cbd61dc176fd9f4b8e2d9d8c5096c9f92c +size 89305559 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c929ba8b1933e1820acc939f52ce69763e2c410c --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8087fb6976d16dce907d0f71a232f600abc5f94af87bdefdfc76d569e9e1aaab +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd401d8328ba26cfe37554baf28346f17ce047d3 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c34db4a08e9a5d4bbd47d2d00ae1249382d73af0343e31a052ff30c0a95cbe0f +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8af0e4d73ecd07b95fb274b559b6378d9f836ad0 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:974f4e2e91d93eed8236759bf4490ecd9cc5577ece8004472ab6ddf0ae034e52 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..621118bfdb404890cd1571e735c6bba3c9a846bc --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:500d8fb17b4fc219a9f2d432e3f87734c70a078dffbbe24a41904aa5fe5f0d0b +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1cc7d5b716033d9147fabde922ed77d07f00269 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3178ba8bed8825d8eb8153f7853878fefbd0c64e93b3095183a7a34e84248ea0 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e31e62bb36301a289a715506bb7d9851903274b4 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aec7c4b882fa4c08cc9da965219bd2f0bb7ec5bd1a5817ed72f1b748746044c3 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4451e4351a7e9041a710e31ad1195c3f799816c6 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6728d39b7f66e9a3db361e4f7d4ddecb428cd6b0fc6eb6a891b43b0c8714f81e +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a77f684c3cbdcd5081514185b43abfdb20a7afdc --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:727131ea94dc69351dc1852b0d7e663c8e29ff807ff91506ec5c9a108c5f62c6 +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd686316896debf2e33285983a3b9a2bfd9e8254 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:849e8633e29dbf7e3eea28ecf2d1c28d32b3f5fc77baf4e07ed53fefc0868dab +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de3c6995692a1bfcfdac57069775355b2c2d9322 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c30f7f17aad9d464dbc2f90b241f5444025d037d056129dd6ee26f15455f44a +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dc9da9a8407884f8edc14578edadc8242180c72 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:534e922df9db65d4141202e579c75b64528870b6115e295bd4be230e31485ceb +size 89305559 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e29de52e9bd40c18e4bb3f0b328a580462e24e43 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:902e5285fc76c9874022c4277b1b832a7dc4c6c26879421bad2b91dbbd5b41d3 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6cbcf042551f0fe17c3628d58624af796ccb78b --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2865514ef9b3247b6422fc1bba3c819e09eb06725e8fa1710a0876ae70c28f3e +size 89305762 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84a9f243fc99863bc8f2bc5dead9ed8986d4bcc0 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5042e26e38b873ffa18b879ae25763f2007f7804bd8627dd742112a9fd50a280 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a26b9546cd910e17fe7573ac9e7733424be51952 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ab0d1c691afec588b419f4565f3a2ad0ec599fad32c7701052ad27dcb7465b0 +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da0da774ca88dae5bb92d322f5cb2f32b6fea623 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abe353e4173612c1efe38bf9ef6201f2b949fcc2f7fd74dcf6efe382fe43be30 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..173171c12e40ed18049dc0d9d428a8aeaea53d33 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:267779d00c3d9fc19802a8fafbbd806b393cdebabcf303915eb2926b1aa14eee +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c864bee5e93e655dfdb8bbb5c921d7e4441b15d --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46c4c58b664e4afc662ecb8000b54bcb178f2deb661c5ccae452647abd7541ac +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be2ffefd49cc0602845106f2849fa264e7e012d7 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acc31f34a737268cfd9846f749da1773856aa1889233f3b7d253ac89b41548d1 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..863bbac26b97626987721a1af1af550ac43a68a2 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:428b3b200fc88b483f138c7c13b3c28277fc7e063e1287b2a1cbaa0646a71899 +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f3275ee801edbdf20e9a5e7610f7a690ddd1033 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22662dcb5d38ef25d5d6c9f2cd54e4c4e36ecc843875f59749004962266c39fe +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0682edcb29632ace7e4362132635dd9011eb0857 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0deaa695f037a09d382c1582c810ca625d86981f9593ac0751ff767ff7e8558d +size 89305623 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d5adc212551dbfe57fb5dd5e6afa6b78706e4b4 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49ab0d5fea63d822180d7f0cdba0c045fc918436029589b7cc8cbc10e29fa208 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..851d6392d706a85d915000b85006d19280bda1bb --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77d3670c0a4206f65a941aa5da95a7d5f1abfdb8b42c115369ace13daae78045 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..792b3fcb8ce7643e4242157d63f139746d5415a7 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:321719c7ecd4d43d68b7871fabc8b81c476c8a9d03593a24baf09a4770b6b1c0 +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcab60181182c8f3d8f570c0d7daa2cf875ee64b --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8774818f8171112a40a91f4e1e614128677a9c9d115a0fde1651b6b1905bc34 +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e3d36ab9b1f2543935bd041d521335e80388a28 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acab7639028ceb7705df765c97aaedd5c4533e91e725f7d9d86d9017a3a648ad +size 89305634 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ac65dd2c48b32e51ed93d0f9853c2b296e3ae6a --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dde16a0a139effd26cf0270f199df7a312760723d9661501a38bc0581add9b5f +size 89305762 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81c541b3701d7ebd5e37f9eb31e235b12d6e22c3 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33f7973f0781467335547bcb0033550af44af5a00758c62a2b17bbb54d524650 +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..adaa7454dfbc983a613a8a8cb5d64fe2d70f6280 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c8b712b6adb210274f9cbf70ab4878a8950f414aeec49cb81784564fc08642b +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f61085249faf361bd1970eda093564b01588952f --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ddedf9960e20b37232d159f81117e65da3cb1325614692090f821bbbffdf1a7 +size 89305570 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..726db8e1f106215e4dfda15b7e670017f3340abb --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32da357a9b3d425dbfe24a83c850841e8ad4e5a005d333d78a8295e9903c4d6f +size 89305698 diff --git a/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20cebc7003e7dfc61827f7e70c797943e67e4758 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f55f0d12c5024b1691fa7d9a830e2336da6552eee17f2cbf8408694d1b0ecc60 +size 89305687 diff --git a/2b855b4bc4opt2/global_step78678/layer_01-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fad7ff7ec2e7e7af1f6d492f8ee430c52bbfef3a --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:483ccbad3482e68d736097ce1f45e5b703a46d906847bd72f2b5d1ffcd7921c5 +size 241239299 diff --git a/2b855b4bc4opt2/global_step78678/layer_03-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c76b1728dcf7126565cf2826a0b5ef8219e257b --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23c48390392cfe8c9bbb7083bef3a9ffa37c8774136cc46e97d2b85e4ef7443b +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_04-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e08ea1b6d04788e097bba8b22a9e631408b2eaf3 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89184858384c4481c9bd2d16a33a85449cfba9e6ebd5dad446ce6dbd07f732b2 +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_05-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d92efd10af7a024edcdffb896d1d61bca32e183 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b0e6fb27a684ac7355e1feb223a33f8ee9fd95499f674a793479dcb53488417 +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_06-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbcd35a3e8ecd8a4be554b87d56466326696a654 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcffcebb4364d981e278d0b49d735edcc48c4cba7a904e27521ffedec6bc99bd +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_07-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95b5da25a9ca6419c472ec43cc165744a43dda04 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:281c3fee3386156e99aa814c0b4d1fb38f75f32455ce1fb8f6e31f09134aa2df +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_08-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc227d4c26e148d4e90503ee79c574e4aa60f7aa --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0d4a5ad40c7228b9dcbc4fcc3b5595a1e2f5caafc6439854849e59bb016d9c7 +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_09-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dadc448f9ca980debb5f52b93906d3ded991fb5 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b90463dcf2ab6c24a0f887bb6e349072ece5c0d15cb065f6f3f2c5698415589 +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_10-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f358ccf368b6b80939775b3690b1bfed7cb67021 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e48d0a07a9cb5f6debc19315f66267133ebf5b42553973a0b59b7fc40b95d2c3 +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_11-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d0fc17d804fb5ee702e096515c05ea6e2db3924 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:252176bf900a39e7cc6bf022d6d8927d24520340f7018eff3aaf210e17bb7862 +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_12-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7639517fa96ae594865d8ab76cc02ecda257f5bb --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61800605a739927e4496d5415ba94acd6a47c5f16616fb4c67145622c1cb6ea4 +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_13-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22d252883dcee9b7c3e3933a6c08006a0da17bb7 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1118c817fdef67c58919d47789301bf9712373b820eb507c364af4036c3cd39 +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_14-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0b478ed9c41683b3f1760e4ebdd61341c9ec43b --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2ca312e5afd3e5d5d5b8a4788ce03fb7b5575dd9b4355bd3b89d4d17313d2d6 +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_15-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed22de8f2a4b39f94025cb53596a97490742a90 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e70b627e2b98d09bec3d793e4a4ee2279e7b06c4e14b8133a1dde721ec11daa +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_16-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c91e22b895e5ae5875c7f633fdc9d9ddeced3d1 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a4d0f11220869d4f99bca91bdae5d648c38b7dab246f95a22b931e531d7a45b +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_17-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad8919055e7a7f2341f5cad881b5dd20d77283e8 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcc270ada817df99a0e06285f5d088ef9b14cb2ca5ff70f2f7d1f8dc8cf527cf +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_18-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bc9e3339c59fb31da79f71d0a88ef0da26e8a61 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3415ec9e19c694a3abe3ba3f9d5a6196a8e635e50a3a4b03a2f39e3069150404 +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_19-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7a2c42770f3097e38ed386f1f11ada59ba7a7ea --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6c9d3a75e7fd37e77d7c985dc82b0c2ea5a7073d8c06a228326bf15762c35d9 +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_20-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3517529a1894045e542cae858da7a6afd106dac8 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8999c16f43ed91b211d494dd5b89ac740ccb6d27ac93529977db7ef7e38b4b44 +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_21-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba6ac29388fa58392a3d1ce19d5d47518ef4bd08 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d194877ce2a949b6abca96ce5b1af0cb751557ee0726d95a2dd5c0d3927262c8 +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_22-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b01b72a2d58b6a5bae82627d44b22153b8870f46 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0802afd9bf8dc22765467346b2fce446574f82a4d39bed82a207cf0c643996c2 +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_23-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e493cb84e879123384b3c7040735a8bdaae41214 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38f4cf3ac8cd1b80b427a365d1f927d715c72871168bde3790b08145dd53855b +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_24-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30bd55ce13075f2b30ed3c9209274e7351d3d8e2 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6048230a896647d6b1a3b345d730690155b945498493fb5f758b5c4d24ad4bf +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_25-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d36cd9a07201b77f1194f7bceceae6eeac2b171 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:790ec982dd74cf55cfa1e3ed1c75c8f797fa92315a209bfd90f5d051de1bff2f +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_26-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f450f5027970b4bccc883b837a092c75e1da0be --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d254e47a115d0e450bf9b3472aa83d5295a4f9eb22f7124b4225e57fc7c60891 +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_27-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..679605a744eb505c8f053efd503edf93f2b93301 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:925d8cbb5f431b781c157e1a147de1445ce2a42ae0b11337d82f534c4c323de2 +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_28-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7f36e51b85dd855e5b942edff9b75194cc0b07a --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e8d988c1983bfb05cf337e7c42bcd670f521aebe07ccad4fe0acb9bcfd8a01b +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_29-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d145094c57242f788b96b45d8e86aa05697abf36 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79916c35e6ae144bf08259f45eb4415e38c7f0e3ac51fbf0107f463eab733cfb +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_30-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f324ce81f41f313e6d0fbe6a323e80bbd84497b5 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb25657cee313fa9c02d0099e1ce5b5507bdb262752f9a51b6c9d78acd9a782a +size 127466243 diff --git a/2b855b4bc4opt2/global_step78678/layer_32-model_00-model_states.pt b/2b855b4bc4opt2/global_step78678/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..965e741500318aa132cb45f0a1899673ff92c395 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dc03496dc40073540eead2ff91a38d1d9505d170487b1656ede0d72a440c009 +size 10435 diff --git a/2b855b4bc4opt2/global_step78678/mp_rank_00_model_states.pt b/2b855b4bc4opt2/global_step78678/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cfbb2dc6a98e63e61959351ae0a959edd7baff7 --- /dev/null +++ b/2b855b4bc4opt2/global_step78678/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:111567b898dbbadc50067802dc1ea14c4e604982dbaf62e1c15bba46ce33ec09 +size 45363 diff --git a/2b855b4bc4opt2/latest b/2b855b4bc4opt2/latest index dd4ed4f46fbdfdfeade5c057e176c669f8c232fa..d443bef48ee1f8d573733591fa6074df5f57673e 100644 --- a/2b855b4bc4opt2/latest +++ b/2b855b4bc4opt2/latest @@ -1 +1 @@ -global_step70858 \ No newline at end of file +global_step78678 \ No newline at end of file diff --git a/2b855b4bc4opt2/sbatch_2b855b4bc4opt3.sh b/2b855b4bc4opt2/sbatch_2b855b4bc4opt3.sh new file mode 100644 index 0000000000000000000000000000000000000000..2338077a314c0ae89b0e5ba8445ac98580e69369 --- /dev/null +++ b/2b855b4bc4opt2/sbatch_2b855b4bc4opt3.sh @@ -0,0 +1,164 @@ +#!/bin/bash +#SBATCH --exclude=nid007571,nid007112,nid006774,nid007502,nid007506,nid007507,nid005145,nid006692,nid007218,nid007123,nid006124,nid006123,nid007496,nid007237,nid006852,nid007206,nid006947,nid007212,nid006977,nid007222,nid005444,nid007219,nid007493,nid007221,nid005300,nid005619,nid006118,nid005203,nid006113,nid006481,nid007077,nid005208,nid005207,nid005879,nid005901 +#SBATCH --nodes=32 +#SBATCH --ntasks-per-node=1 +#SBATCH --cpus-per-task=32 +#SBATCH --mem=256G +#SBATCH -p standard-g +#SBATCH -t 48:00:00 +#SBATCH --gpus-per-node=mi250:8 +#SBATCH --exclusive=user +#SBATCH --hint=nomultithread +#SBATCH --account=project_462000119 +#SBATCH -o logs/%j.out +#SBATCH -e logs/%j.err + +VARIANT=2b855b4bc4opt3 + +# if run without sbatch, invoke here +if [ -z $SLURM_JOB_ID ]; then + mkdir -p logs + sbatch "$0" + exit +fi + +set -euo pipefail + +# symlink logs/latest.out and logs/latest.err +ln -f -s $SLURM_JOB_ID.out logs/latest.out +ln -f -s $SLURM_JOB_ID.err logs/latest.err + +KILL_SWITCH_PATH=kill-switch-$VARIANT +CHECKPOINT_PATH=checkpoints_$VARIANT +TENSORBOARD_PATH=tensorboard_$VARIANT + +# Data +VOCAB_FILE="gpt2/vocab.json" +MERGE_FILE="gpt2/merges.txt" + +TRAIN_DATA_PATH=train4b.txt +# "train: 1.0 0:1 /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_4B_text_document" +VALID_DATA_PATH=val.txt +# "validation: 1.0 0:1 /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document" + +PP_SIZE=1 +TP_SIZE=1 + +MICRO_BATCH_SIZE=2 +GRADIENT_ACCUMULATION_STEPS=1 +WORLD_SIZE=$((SLURM_GPUS_ON_NODE*SLURM_JOB_NUM_NODES)) +GLOBAL_BATCH_SIZE=$((MICRO_BATCH_SIZE*WORLD_SIZE*GRADIENT_ACCUMULATION_STEPS)) + +# Model parameters +source model_params.sh +MODEL_PARAM=("${PARAM_2007M[@]}") +NHIDDEN=${MODEL_PARAM[0]} +FFN_HIDDEN_SIZE=${MODEL_PARAM[1]} +KV_SIZE=${MODEL_PARAM[2]} +NHEADS=${MODEL_PARAM[3]} +NLAYERS=${MODEL_PARAM[4]} +SEQ_LEN=2048 + +echo "Model parameters: d_model $NHIDDEN ffw_size $FFN_HIDDEN_SIZE kv_size $KV_SIZE n_heads $NHEADS n_layers $NLAYERS" + +SAVE_INTERVAL=10000 + +# Tokens: 55000000000 +# -> Samples: 26855469 +# TRAIN_SAMPLES=26_855_469 +TRAIN_SAMPLES=40_283_203 + +OPTIMIZER_ARGS=" \ + --optimizer adam \ + --adam-beta1 0.9 \ + --adam-beta2 0.95 \ + --adam-eps 1e-8 \ + --lr 2e-4 \ + --min-lr 2e-5 \ + --lr-decay-style cosine \ + --lr-decay-samples $TRAIN_SAMPLES \ + --lr-warmup-samples 402_832 \ + --clip-grad 1.0 \ + --weight-decay 1e-1 \ + " + +GPT_ARGS=" \ + --num-layers $NLAYERS \ + --hidden-size $NHIDDEN \ + --num-attention-heads $NHEADS \ + --kv-channels $KV_SIZE \ + --ffn-hidden-size $FFN_HIDDEN_SIZE \ + --seq-length $SEQ_LEN \ + --max-position-embeddings $SEQ_LEN \ + --micro-batch-size $MICRO_BATCH_SIZE \ + --global-batch-size $GLOBAL_BATCH_SIZE \ + --train-samples $TRAIN_SAMPLES \ + --vocab-file $VOCAB_FILE \ + --merge-file $MERGE_FILE \ + --clip-grad 1.0 \ + --kill-switch-path $KILL_SWITCH_PATH \ + --bf16 \ + $OPTIMIZER_ARGS \ + " + +OUTPUT_ARGS=" \ + --log-interval 10 \ + --save-interval $SAVE_INTERVAL \ + --eval-interval 1000 \ + --eval-iters 1 \ + --tensorboard-dir $TENSORBOARD_PATH \ + --tensorboard-queue-size 5 \ + --log-timers-to-tensorboard \ + --log-batch-size-to-tensorboard \ + --log-validation-ppl-to-tensorboard \ + " + +ZERO_STAGE=0 + +mkdir -p ds_configs +DS_CONFIG_PATH="ds_configs/$SLURM_JOB_ID.json" + +cat < $DS_CONFIG_PATH +{ + "train_micro_batch_size_per_gpu": $MICRO_BATCH_SIZE, + "train_batch_size": $GLOBAL_BATCH_SIZE, + "gradient_clipping": 1.0, + "zero_optimization": { + "stage": $ZERO_STAGE + }, + "bf16": { + "enabled": true + }, + "steps_per_print": 2000, + "wall_clock_breakdown": false +} +EOF + +DEEPSPEED_ARGS=" \ + --deepspeed \ + --deepspeed_config $DS_CONFIG_PATH \ + --zero-stage $ZERO_STAGE \ + " + +CMD=" \ + Megatron-DeepSpeed/pretrain_gpt.py \ + --tensor-model-parallel-size $TP_SIZE \ + --pipeline-model-parallel-size $PP_SIZE \ + $GPT_ARGS \ + $OUTPUT_ARGS \ + --save $CHECKPOINT_PATH \ + --load $CHECKPOINT_PATH \ + --train-weighted-split-paths-path $TRAIN_DATA_PATH \ + --valid-weighted-split-paths-path $VALID_DATA_PATH \ + --data-impl mmap \ + $DEEPSPEED_ARGS \ + " + +echo $CMD + +echo "START $SLURM_JOBID: $(date)" + +# bash launch_srun.sh $CMD +srun --label launch.sh $CMD + +echo "END $SLURM_JOBID: $(date)" diff --git a/2b855b4bc4opt2/sbatch_2b855b4bc4opt3val.sh b/2b855b4bc4opt2/sbatch_2b855b4bc4opt3val.sh new file mode 100644 index 0000000000000000000000000000000000000000..817d4c667464fd144a9413bcd63a1f9c192dd59b --- /dev/null +++ b/2b855b4bc4opt2/sbatch_2b855b4bc4opt3val.sh @@ -0,0 +1,168 @@ +#!/bin/bash +#SBATCH --exclude=nid007571,nid007112,nid006774,nid007502,nid007506,nid007507,nid005145,nid006692,nid007218,nid007123,nid006124,nid006123,nid007496,nid007237,nid006852,nid007206,nid006947,nid007212,nid006977,nid007222,nid005444,nid007219,nid007493,nid007221,nid005300,nid005619,nid006118,nid005203,nid006113,nid006481,nid007077,nid005208,nid005207,nid005879,nid005901 +#SBATCH --nodes=32 +#SBATCH --ntasks-per-node=1 +#SBATCH --cpus-per-task=32 +#SBATCH --mem=256G +#SBATCH -p standard-g +#SBATCH -t 48:00:00 +#SBATCH --gpus-per-node=mi250:8 +#SBATCH --exclusive=user +#SBATCH --hint=nomultithread +#SBATCH --account=project_462000119 +#SBATCH -o logs/%j.out +#SBATCH -e logs/%j.err + +VARIANT=2b855b4bc4opt3val +VARIANT_CKPT=lm1-2b8-55b-c4-repetitions/2b855b4bc4opt3 + +# if run without sbatch, invoke here +if [ -z $SLURM_JOB_ID ]; then + mkdir -p logs + sbatch "$0" + exit +fi + +set -euo pipefail + +# symlink logs/latest.out and logs/latest.err +ln -f -s $SLURM_JOB_ID.out logs/latest.out +ln -f -s $SLURM_JOB_ID.err logs/latest.err + +KILL_SWITCH_PATH=kill-switch-$VARIANT +CHECKPOINT_PATH=$VARIANT_CKPT +TENSORBOARD_PATH=tensorboard_$VARIANT + +# Data +VOCAB_FILE="gpt2/vocab.json" +MERGE_FILE="gpt2/merges.txt" +#DATA_PATH="/scratch/project_462000119/data/pile/megatron_data/meg-gpt2_pile_text_document" +TRAIN_DATA_PATH=train1b5.txt +# "train: 1.0 0:1 /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_12B_text_document" +VALID_DATA_PATH=val.txt +# "validation: 1.0 0:1 /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document" + +PP_SIZE=1 +TP_SIZE=1 + +MICRO_BATCH_SIZE=2 +GRADIENT_ACCUMULATION_STEPS=1 +WORLD_SIZE=$((SLURM_GPUS_ON_NODE*SLURM_JOB_NUM_NODES)) +GLOBAL_BATCH_SIZE=$((MICRO_BATCH_SIZE*WORLD_SIZE*GRADIENT_ACCUMULATION_STEPS)) + +# Model parameters +source model_params.sh +MODEL_PARAM=("${PARAM_2007M[@]}") +NHIDDEN=${MODEL_PARAM[0]} +FFN_HIDDEN_SIZE=${MODEL_PARAM[1]} +KV_SIZE=${MODEL_PARAM[2]} +NHEADS=${MODEL_PARAM[3]} +NLAYERS=${MODEL_PARAM[4]} +SEQ_LEN=2048 + +echo "Model parameters: d_model $NHIDDEN ffw_size $FFN_HIDDEN_SIZE kv_size $KV_SIZE n_heads $NHEADS n_layers $NLAYERS" + +SAVE_INTERVAL=1000 + +# Tokens: 35546190000 +# -> Samples: 17356538 +TRAIN_SAMPLES=1 + +OPTIMIZER_ARGS=" \ + --optimizer adam \ + --adam-beta1 0.9 \ + --adam-beta2 0.999 \ + --adam-eps 1e-8 \ + --lr 2e-4 \ + --min-lr 2e-5 \ + --lr-decay-style cosine \ + --lr-decay-samples $TRAIN_SAMPLES \ + --lr-warmup-samples 0 \ + --clip-grad 1.0 \ + --weight-decay 1e-1 \ + --override-lr-scheduler \ + --reset-progress \ + --no-load-optim \ + " + +GPT_ARGS=" \ + --num-layers $NLAYERS \ + --hidden-size $NHIDDEN \ + --num-attention-heads $NHEADS \ + --kv-channels $KV_SIZE \ + --ffn-hidden-size $FFN_HIDDEN_SIZE \ + --seq-length $SEQ_LEN \ + --max-position-embeddings $SEQ_LEN \ + --micro-batch-size $MICRO_BATCH_SIZE \ + --global-batch-size $GLOBAL_BATCH_SIZE \ + --train-samples $TRAIN_SAMPLES \ + --vocab-file $VOCAB_FILE \ + --merge-file $MERGE_FILE \ + --clip-grad 1.0 \ + --kill-switch-path $KILL_SWITCH_PATH \ + --bf16 \ + $OPTIMIZER_ARGS \ + " + +OUTPUT_ARGS=" \ + --log-interval 10 \ + --save-interval $SAVE_INTERVAL \ + --eval-interval 1 \ + --eval-iters 100 \ + --eval-only true \ + --tensorboard-dir $TENSORBOARD_PATH \ + --tensorboard-queue-size 5 \ + --log-timers-to-tensorboard \ + --log-batch-size-to-tensorboard \ + --log-validation-ppl-to-tensorboard \ + " + +ZERO_STAGE=0 + +mkdir -p ds_configs +DS_CONFIG_PATH="ds_configs/$SLURM_JOB_ID.json" + +cat < $DS_CONFIG_PATH +{ + "train_micro_batch_size_per_gpu": $MICRO_BATCH_SIZE, + "train_batch_size": $GLOBAL_BATCH_SIZE, + "gradient_clipping": 1.0, + "zero_optimization": { + "stage": $ZERO_STAGE + }, + "bf16": { + "enabled": true + }, + "steps_per_print": 2000, + "wall_clock_breakdown": false +} +EOF + +DEEPSPEED_ARGS=" \ + --deepspeed \ + --deepspeed_config $DS_CONFIG_PATH \ + --zero-stage $ZERO_STAGE \ + " + +CMD=" \ + Megatron-DeepSpeed/pretrain_gpt.py \ + --tensor-model-parallel-size $TP_SIZE \ + --pipeline-model-parallel-size $PP_SIZE \ + $GPT_ARGS \ + $OUTPUT_ARGS \ + --save $CHECKPOINT_PATH \ + --load $CHECKPOINT_PATH \ + --train-weighted-split-paths-path $TRAIN_DATA_PATH \ + --valid-weighted-split-paths-path $VALID_DATA_PATH \ + --data-impl mmap \ + $DEEPSPEED_ARGS \ + " + +echo $CMD + +echo "START $SLURM_JOBID: $(date)" + +# bash launch_srun_32.sh $CMD +srun --label launch.sh $CMD + +echo "END $SLURM_JOBID: $(date)" diff --git a/2b855b4bc4opt2/tensorboard_2b855b4bc4opt3/events.out.tfevents.1683799351.nid005754.102211.0 b/2b855b4bc4opt2/tensorboard_2b855b4bc4opt3/events.out.tfevents.1683799351.nid005754.102211.0 new file mode 100644 index 0000000000000000000000000000000000000000..e55001ddcd109142861149b18714f3a7d27445c6 --- /dev/null +++ b/2b855b4bc4opt2/tensorboard_2b855b4bc4opt3/events.out.tfevents.1683799351.nid005754.102211.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3d92261447397b10c1a287f395ef19bf70a75378b99a8edd0429d8e5144c1e5 +size 141088178 diff --git a/2b855b4bc4opt2/tensorboard_2b855b4bc4opt3val/events.out.tfevents.1683928725.nid007239.70324.0 b/2b855b4bc4opt2/tensorboard_2b855b4bc4opt3val/events.out.tfevents.1683928725.nid007239.70324.0 new file mode 100644 index 0000000000000000000000000000000000000000..d71f71ab29658940f3ab2290dbd08c456d9d5f91 --- /dev/null +++ b/2b855b4bc4opt2/tensorboard_2b855b4bc4opt3val/events.out.tfevents.1683928725.nid007239.70324.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a2418c2e9f59a97ac1191ba12550108f89bd1e2a3ae70ecb472b79e2e46e199 +size 980 diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt rename to 2b855b4bc4subopt/global_step80064/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_01-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_01-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_01-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_01-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_03-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_03-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_03-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_03-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_04-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_04-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_04-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_04-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_05-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_05-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_05-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_05-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_06-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_06-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_06-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_06-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_07-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_07-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_07-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_07-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_08-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_08-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_08-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_08-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_09-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_09-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_09-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_09-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_10-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_10-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_10-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_10-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_11-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_11-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_11-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_11-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_12-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_12-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_12-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_12-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_13-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_13-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_13-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_13-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_14-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_14-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_14-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_14-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_15-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_15-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_15-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_15-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_16-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_16-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_16-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_16-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_17-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_17-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_17-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_17-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_18-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_18-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_18-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_18-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_19-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_19-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_19-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_19-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_20-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_20-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_20-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_20-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_21-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_21-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_21-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_21-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_22-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_22-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_22-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_22-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_23-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_23-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_23-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_23-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_24-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_24-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_24-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_24-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_25-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_25-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_25-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_25-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_26-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_26-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_26-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_26-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_27-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_27-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_27-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_27-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_28-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_28-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_28-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_28-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_29-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_29-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_29-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_29-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_30-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_30-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_30-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_30-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/layer_32-model_00-model_states.pt b/2b855b4bc4subopt/global_step80064/layer_32-model_00-model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/layer_32-model_00-model_states.pt rename to 2b855b4bc4subopt/global_step80064/layer_32-model_00-model_states.pt diff --git a/2b855b4bc4opt/global_step80064/mp_rank_00_model_states.pt b/2b855b4bc4subopt/global_step80064/mp_rank_00_model_states.pt similarity index 100% rename from 2b855b4bc4opt/global_step80064/mp_rank_00_model_states.pt rename to 2b855b4bc4subopt/global_step80064/mp_rank_00_model_states.pt diff --git a/2b855b4bc4opt/latest b/2b855b4bc4subopt/latest similarity index 100% rename from 2b855b4bc4opt/latest rename to 2b855b4bc4subopt/latest diff --git a/2b855b4bc4opt/sbatch_2b855b4bc4opt.sh b/2b855b4bc4subopt/sbatch_2b855b4bc4opt.sh similarity index 100% rename from 2b855b4bc4opt/sbatch_2b855b4bc4opt.sh rename to 2b855b4bc4subopt/sbatch_2b855b4bc4opt.sh diff --git a/2b855b4bc4opt/sbatch_2b855b4bc4optval.sh b/2b855b4bc4subopt/sbatch_2b855b4bc4optval.sh similarity index 100% rename from 2b855b4bc4opt/sbatch_2b855b4bc4optval.sh rename to 2b855b4bc4subopt/sbatch_2b855b4bc4optval.sh diff --git a/2b855b4bc4opt/tensorboard_2b855b4bc4opt/events.out.tfevents.1683213095.nid005063.70163.0 b/2b855b4bc4subopt/tensorboard_2b855b4bc4opt/events.out.tfevents.1683213095.nid005063.70163.0 similarity index 100% rename from 2b855b4bc4opt/tensorboard_2b855b4bc4opt/events.out.tfevents.1683213095.nid005063.70163.0 rename to 2b855b4bc4subopt/tensorboard_2b855b4bc4opt/events.out.tfevents.1683213095.nid005063.70163.0 diff --git a/2b855b4bc4opt/tensorboard_2b855b4bc4optval/events.out.tfevents.1683366796.nid006401.21904.0 b/2b855b4bc4subopt/tensorboard_2b855b4bc4optval/events.out.tfevents.1683366796.nid006401.21904.0 similarity index 100% rename from 2b855b4bc4opt/tensorboard_2b855b4bc4optval/events.out.tfevents.1683366796.nid006401.21904.0 rename to 2b855b4bc4subopt/tensorboard_2b855b4bc4optval/events.out.tfevents.1683366796.nid006401.21904.0 diff --git a/2b855b4bc4opt/tensorboard_2b855b4bc4optval/events.out.tfevents.1683367486.nid006518.105000.0 b/2b855b4bc4subopt/tensorboard_2b855b4bc4optval/events.out.tfevents.1683367486.nid006518.105000.0 similarity index 100% rename from 2b855b4bc4opt/tensorboard_2b855b4bc4optval/events.out.tfevents.1683367486.nid006518.105000.0 rename to 2b855b4bc4subopt/tensorboard_2b855b4bc4optval/events.out.tfevents.1683367486.nid006518.105000.0 diff --git a/2b855b9bc4opt2/3474587.err b/2b855b9bc4opt/3474587.err similarity index 100% rename from 2b855b9bc4opt2/3474587.err rename to 2b855b9bc4opt/3474587.err diff --git a/2b855b9bc4opt2/3474587.out b/2b855b9bc4opt/3474587.out similarity index 100% rename from 2b855b9bc4opt2/3474587.out rename to 2b855b9bc4opt/3474587.out diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt index b6d0a5a034ed2ad9292f466e1a227483bb00bd46..5789bfb4fb22dbcd5adcf32b6d579127ad3da6a9 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:faa982714e04e5173879d7e8907ca1f82bd8bda22ab3541fbebca64843af2ed9 -size 89305623 +oid sha256:3e575cb7fa963f33b362e8aaa0c37a4f72cbde4e33d964804793a007638ca99f +size 102174039 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt index 7d54e663d5839b57a166d0f08b30f7f2e5ad3524..7fcedfbc0388fe7957917e1ce42b97182b63fc17 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0b5f835ddb51519dc74cf17a0c8b0adf6a13a454f3ed3362f51b7261fe30c9c1 -size 89305709 +oid sha256:2d5b3b6c942def0943a85051d75fcb0059eaf1d3e74134ef4c3323eb1c860a22 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt index 6971eb008dc154281bfb3d25c4ee38f5a3273be8..0777acbb84e78a5551cd3f2b79093b73a891f851 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:12a0a83e4198056491dc9f390fe0a146c6e9f74a01911f5780ddd8dc733424d2 -size 89305773 +oid sha256:8c3dc5b70c4428cbad46bb2a237995dba4ae2b0ff1a7af68bf8882725dad1fd2 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt index 7b6828f65f5d30c06d80037e475894a81a995c19..c9572c4ab1d5848fd3d3783d7be0e4767c839afe 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ee501b7625c1351def5566ad8b547da1ef61ff44f42ebe3917e2ca3d84198d74 -size 89305645 +oid sha256:0e65abfca8f914d559e6f5d72397bda9c0fdea79b48d745e6fbecb7c7b819bb0 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt index 70d34fc9202b822d873692ecdafd272ee04ca807..c1be572f1204680948f531cd363e742675767d61 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a4facf9909cfafd454afb769cd28e5f11f6f1fee7d905fb337409d35edc0c3a8 -size 89305645 +oid sha256:2ad043c99471b4c22b99167dca623f5a74ac11c2c755ebf996fc6e572beeee7a +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt index e930159fbc247ac7a52908cc09fd5d295c1e6158..e2ffe4684f2e6665a7a60888653fe59b0f8f1931 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b1b185f72bae9093e5d06dc752907249620fbb0c660d2d4718c1f6cf070141ab -size 89305709 +oid sha256:d91c116dc1c49b9917423b60698109c056b75509c2b7dcb35186e12e755fc21b +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt index 90d86206aff05a8a6348705fe3697c47dcf4a1f0..8eab94295e6e358d49445bf56f3b2de328a96cbe 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:42d340a0d466b46658e6c1c58074125ad6ba2dc75078c279ef7848c4db5fe543 -size 89305645 +oid sha256:0b621b138ee9744d7cc2158d3121e91d4254c0468748db965e0d8df36bd32935 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt index 7c9983dbb320e8473c099a6e2f19cc76a52d4a0f..e69bd79fa88afcc653d8cbea4f718508229bdaab 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:477f26b4ea4ab89ae40dee458e5927e1e2ab3e49dd378f6f037463cc74531099 -size 89305581 +oid sha256:12d5b613165db85fe6b0fbb691cebee38d866ea9e21efa3ebe657237423c058d +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt index ddd900c8fe7edb0c61edef90191d0adf2f5d06f3..1e653b517792eefff04596677fb9a2af413cf17a 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:58b738a315ef272521f5a7552286a28aa3873a34b49cc9a702f3d1bf4bc6901d -size 89305709 +oid sha256:6cce636c34df252cc268b09bbdd047a3284c48d5e12b5888deab429d530b009d +size 102174189 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt index fcc5e5142f7e6c9b0c4c2c3cea5294351c8b9fff..aecee0b18c7a5a7a568b484b3fd2f565b8d4d2d7 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:217c7a1222c45aaaf5bb7ee06d631c898fdb94084616eff3dba48af4611c2bc5 -size 89305645 +oid sha256:30fe78336f267a83c6a09d8f2046c6dce2fcba53c75532465a337df062d6b679 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt index b91212a7b8c1e4dc50e161ff97e7fcfc323d4b87..1a8bed45594e9f28804d979d4860e0183a7b2dc7 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fb437d115f5350e1a1d03ef244412a54f02079808b7431b464227a4b58f7cb77 -size 89305645 +oid sha256:12ef6ee6f073dbe81effe71c38938e7c5a480484231e33b661582dd4ae83e8bd +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt index 106c014f501b1008fb888b51370480572e902b8f..a430d8520d898a2b606374eaf775bedda8dad414 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:adf6537f9b0f3e1d13faab510277b43022217244cdd05ff6ce3e2880536f5a6d -size 89305698 +oid sha256:0c1490da4d798720d8952574a91c5a25dc47440fe4597e14f5ece51e28bf467b +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt index ed9dacd71074c4fb9b0bef8ed173529343d9b38e..c1fccece2ef24b927e665593c3389771740904a4 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ada8c88b95c2ead1a001e5571aa82888dbb0997a4fa88bfda97f821fd8a97f72 -size 89305645 +oid sha256:b43f4cd96c95fedbfadce7114969999d134aec9136d6dcc58b77ace11ff0797f +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt index db56915a03ef4a4c305c07e6f93b7c1919815416..3267cf2afbf2251c466ce8bb4d46af886e6732b9 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:32aac13996654507d50d338cd6839bfb2845455fb366d178d3a6084f32a6559e -size 89305581 +oid sha256:d6443eb6c33a68f2f3ec07e95006897585cbdb851957949bdf33f3d1243fe967 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt index 2022e3dee1fd573a05c0c76a479715512f9646af..671e2e55a25170a5528774a090d89d4578488104 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b676e5eb8448aad6754e2de0a544cda191d8c2f5d1d5519cdf6e1356ab683d9a -size 89305645 +oid sha256:d7de1c74913b1d219e2ae46b2410b07c1bbb52d25aa9434c578afec1494fa73b +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt index 8d9f9f6d593d34fc94a5ff7f505d567ceb09c4bc..48a39e075bc67c2552482551f95eea0784664a41 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:358b839a65eedf64a2c5cf1939fa0ca6ff83fcaef26c4f360fae9d80eb49f284 -size 89305773 +oid sha256:db4d611325f4818dc6464f9def09187322f0f1f3cebe3ca4ab05a23adb84a1b7 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt index 0d887505a2ab6e3fdc489b2bd49b7533573fcd5a..cf6411a7c9637ea92ac9285e25a54dfa8e51ac7a 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5f300e532f53f6010f8811e93f38511eaa779f66692aa0ef7b6d156b54df58d3 -size 89305709 +oid sha256:9b7dfbe1a70526e1b48c0149189918653d5452304ab17af497b0ec3e808ea623 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt index 46b71a736fda324f107a2ee885546c07ed4bebe0..47912f4d3a802adea2e922e7356540615ed8b24b 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ad47b2b1b2cddf6a7a46c7870f89e99988ec09eb956ee9bffed6651648e7f2a1 -size 89305581 +oid sha256:0828ec100d51bc12e2f3fe28a834c1f74aa333a17def29414f369b8100f23a7c +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt index 9c9a58720ca6b081ed9c00b67b589901d0eeed8c..f203fa93ce221f8987d9530e13d62497c12e5f23 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:85eb9f57e162b564ee93bf8ff0e7e54d6cbd11498b8336c19a2b831d2e115c57 -size 89305581 +oid sha256:758cc6d22fa4adca0778e360fc351fbf40528d2822a6c79d8506d656fca1edac +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt index 1fbddd4406498729a14fe1aa03ca5e0c06ebf688..9b85545c6403ddb9363174470e787f171182a6d1 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d2134b5efa561efb8e25a45dae2988a0cbad71a9bf1f17073848b2fda3d74664 -size 89305773 +oid sha256:6573591981c16fdcd87d9749b563274f8b2b995c808daa00edac1e15aa48b3f6 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt index daea4e53122300e1b347865c5f7ef1622bb3a932..9e8f6cd5154db82db5c65c7eb7d80a428e0853bb 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dfce8f40c119da3f4a3db19b562ef44645e2dc0e725382dda629c1954243a393 -size 89305709 +oid sha256:2f6fd6664d2edd72160968315e2431db34f708675b1fcaec5e3a7947725f03c0 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt index e3bcc4438f9b186afd64392dcf76611def352505..b6c1930d975d6843f30d72d45954c1b1b55bd224 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cafac3192e7ec28b9e1c9cbb16f0c1a1676f62cb83601b36e64c45e342da6758 -size 89305709 +oid sha256:76bf5a9dd88a132beae5c6170cf3c3797b20fa9b8413309c2297a8efa5aefb75 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt index 82c7216af55e573b54bd4edb309525e094f01834..f61fb932a148430505f92bf79e13b1d35fdad70c 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:48b57cbfa2d1e4e9019b0f5aef558e24c0b1e00053570e6a28220f0886bea8d3 -size 89305634 +oid sha256:5fced28298efcb7410f5e31ad9da287f68768e9c69ae1b6a255d3968cff0005d +size 102174114 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt index e5c804bd8d963cfda03eb721bf93558c703849f4..035dcb992002cf9d9329f36ae37f54391eddc5d1 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5b6b96b9ed2abd074e83adb8ef0fa83d11afa4d1c986e35e38641b78bfdc8718 -size 89305581 +oid sha256:bc1f9732474ae1462968f19bcb30365d6adc968e168b21ea0ba33ed71d29da24 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt index 8299c356d1600cbb478f9016e7dda09bc65d08f0..6953b8d7241d718fa92f2992f1619d341096163b 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0ebfef188ed0e153d6e4ae9739d13bec6675054d9e14d3bb47a460fcb53b773c -size 89305645 +oid sha256:785602ae9978402b3821d6c87dc3903486dc5142371e654c3fc60d20e16f323d +size 102174189 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt index 24b423a0abe90f488bfa3ff39bc39867b2b936ba..aa38c3d902a7d91eb855e99f94da6701cb900c97 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9d068a4414e726d8cf79bebdda996a1dd4e819467f73f69e2d688306aaad9139 -size 89305645 +oid sha256:6b35a4e0d3d2914bf2a32281623091f655270e5dddfbdbef77e1e415adc32c73 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt index 3ed400eb464ae2fffc94eb85f27e5460c5ae08a3..4997c4f25f311b012d216c51cdf5294796ed29bf 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e8e116d13767137bb8977c40b95b59d585db7cbd13fe772aeeebc0c0ea9143a5 -size 89305709 +oid sha256:737377e404292d59a7df79c3811678cf82f2b10c112c7f9b861844e9bc32cf9c +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt index e580fe7618c7d0ec93998bff8fb73795b7188519..bbc39b0f7189bdd8d1f66035e322e253fedd46b9 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:086a3013c2f19608b5193c2f8e2c3f7d16c2f0ee19819723beca3a0a90cf8205 -size 89305645 +oid sha256:b55cd4040cab07fea0d426ac76086a52998101b45c8ca392b78eeb347d222de0 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt index 9fffd661614b863594943d33a7fd94e2699a2fc9..3cfcfeda039838feb80cb89d007538004bc357ef 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a446d582db1b2dfda4e2155a229434884ed04ef542e53e84642d63be9a020cdf -size 89305645 +oid sha256:cdcb6a73be0050be09e4bf8b3cd299d9d7ca79804a1d91e61691f0667cd47011 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt index e49b0166f9a202de6c785edd600efbbdd82eff37..5193720d07a1d2745754edbd85744ecb3570c6d8 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a7ad714ca79fe8e3f83afa4772c27572b74d3c01992392d53343e71066447569 -size 89305645 +oid sha256:7ef16527255ae855934b52a374d99fad5c83c559ba8f1f8f051ccbc747507946 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt index ecd6579dff88b5e2eb91a9772cb31879e487f7c5..02f71ae68e2f757ca0ab5b360d4d838607eec897 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:24684b3e40033ed67d46da85089a53eb9014b06fafc9f5231493e05f684ec72c -size 89305645 +oid sha256:1b88859329c941f2b82cb8ce4817d082ff61d35e2cb68983ef02716277990a20 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt index a4dac505df05b237644aa67bcdf6eac591268cc7..b1af5da7c5eff63bddab0d5135641a7f8083019c 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:73b9d4928e58024332d18f6c01c793b342f84bc81de7c7755c8e7808f0b107ac -size 89305645 +oid sha256:1628d2e0d3addb02371918fa069e71b16cc1d8b84664dcea99d97e27bf290b51 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt index e5dc35c92d823015380fef9a3976335ac2b04868..4359722588998f71baf0133a24e3792a8984ed4d 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:23bbcddb4b55bd57a3b6859c6cc0314dcaf59da2c749721cab5d66609c73c247 -size 89305645 +oid sha256:3288fedfe468b05e9a27a13cfa6583984236549dfaeda4f025d155c6a93602b3 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt index e9e4ae4207ce022717f4e800fd3e94fd99048964..cfb6b82b6243c09241dbd00223802324dcd54490 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:31567a5c83be86be4856e312771aecde609ba288d38a6c3f097cf5e8fdf48564 -size 89305634 +oid sha256:65b36021436e4a7752b67611b633e4778a399a33d7d1bcb10f35cdf411f204d7 +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt index 0e916ad54d72cbbf4bb980a7fab44af6b9960ddf..0c5712abd103d57ac8c7f306d8b5367fffe1aa21 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3469cc56e844878ec3cb2b1961790ff803c15e12cd67d7e3f8bbdb02c6b83ebf -size 89305709 +oid sha256:7fd379f2c76cc2dc40c03e2445cef616ac6022efd56078da85dda560f63f4cc3 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt index 7ce481abc8683e8684db818542d41385d1d5aaad..531208ff2af03acca0be76e3f37cfd835e50bb71 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:850534ef5644fffa718e451aacaf4321543b1c42b4d7a5db143233aa05741d88 -size 89305645 +oid sha256:221aa370475aec63c56418be36cebbdc6e2b11e9bc13aa5605e9d880afffe374 +size 102174189 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt index da623984484826742ec80478c77e0b9e88ec4e06..59a08baaa0cb58b4e5b5d9c0cd036afea1669266 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:224fbe0f94eb1d3a87671c4d663744149966a31f8e70b913300a636e5f824d98 -size 89305709 +oid sha256:59233492d3c83205dfaef9923377309a5e9cb0cbebb38ed9462c57f5ccd680e0 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt index dfc84c357bd9054b5a90c538e5d269b5d9b34b0f..afb078780193c5703fe106dd7d7b4b9bbf29c2e7 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f31fa73eb077296d108ac495f08613c70c020a27948c443f69b79aefcf6af28e -size 89305645 +oid sha256:6d85d8a95a521c8b061c6fad96b934b6eafcfdedee8f261274c6df1e8e6340a6 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt index b33a15a80268632d31aeb2d23782484892b6a35a..be2a59ebc4b065451ca8af9c91e417391dbb663a 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f10e69448e1e9603afdb4d4793c4168ee6e4ee63f8a2518e5ade366e0c72a46e -size 89305581 +oid sha256:90d579f4c42e1475c3203f285610bd6f5c822b89fa52749261da870c06aad747 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt index 088e3c59e0f9268ed21e1cf88c59047274873fa3..8e735181808f405c30034c7ce7ebad2cdfdd4b5c 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8dcf8d97144c5a5b7cca517192dde0592e5e2d632bc2c511f75e3e51623c80b4 -size 89305773 +oid sha256:41bd376bebe1b75373c3192f86dd49a862e049cc10b02f194f3c456cfb691937 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt index 3132a1cca69bcb83551cb8a6b0c4b6f0766d9d48..f3320ec6f1f5ed87c8e2ee1030e8b33d9a6b0dbd 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:577173d8652361137b08728d04f1856026d79ef1d2dc9b187a3157ada4be280f -size 89305709 +oid sha256:d9131462a28f2e58a1739ad5d21b58ba227ffbf292b0edf2c0443ba96a374a99 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt index 823aa95984bfbe9628a59aee4c26069c4b125975..d935d7837cdaa03a529e1afff69f3f5689f5e6ba 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9b1e8ecc4f9cfac56e5a471b483859e797b2dd7951b84578bcb42fade6c23b13 -size 89305709 +oid sha256:e1220e0d38fa67be82b865f2dec7dd11bc2699957e89dbb40a949578fbed1cf6 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt index fd293f3c5fe7ce901f44f741f5cd937ae363322d..58edbe4186699fc13817025e15e6a4efd2bd8839 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:103468c2c541bb702750bd677e7ce1dce94e9fa620f660d5bb25217d86b5b95e -size 89305581 +oid sha256:7eec228ff48b40161fcbec64a4cadff1116747728da2330eb59f70724a9a3282 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt index f1d03f4f40214230c4ff0fd10c804de3b9dd1bb8..77cf29bfdfa9d2a1fdffd469300fa0c707259bab 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0fbfc7aee194e50cc3925a349e14c8f33cbb354572625af123b089f730857be1 -size 89305645 +oid sha256:4ac14891430dbaba79dde73976f1a1f0583730cee4cc2b39cfb9582c7cf95f4e +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt index e4a18f47b00c6a419329064b51343bfc648e634a..524db46ba65d9947da33f9ac0380cc6ae9fe0a6c 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1105a7a4aa85d2dd8fa0faae0c89497717143a02972983651ad2849562f39675 -size 89305698 +oid sha256:9c622a0d3bbc86d17ddf3165935b34b6dd7588b5646c13effc38f1bcc3d5b260 +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt index 8156a650a6af3d5bcc1d36e4b497109739004260..c1ad7611e495de13ea67854c72da72998e4a08a1 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cfdb83d2082dce61d301792ce948124e133b3ca650435d9f10488c2412bbd155 -size 89305709 +oid sha256:c1e1ebe5c2c89c64cea24a69f232d8361d7b3a7a165bce28e751319d77488da3 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt index c26efba873c2953169dfc5b6754001bf637ca515..64823b407c38559814c9ce7e47f40e0d3bfe4671 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:016a621d16a426d8b770fcc8e02e1f18da370268c83caa719c29bb108a6b324e -size 89305709 +oid sha256:3be56b1725755e2460caac77da6aec7f136482f44903b54cab74080ac761f9e3 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt index bda372b5884e9389bf57dc924d800df1d20a30f2..c4059199770b39f0c0a1c275925fd0a6dc246a98 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6eb910722e2cf80349cfc962ee6fb1aae09c05e9ad97e93ccc08d6ef85ff4bc6 -size 89305645 +oid sha256:125d99c194b7bf50640de485ba983431cfce9c9c13d91fb73af9c7136ecec21d +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt index 04cbd6dc8e696a9bb553ba3148c92e3a25f66d72..aee324ab383b3d6b5932db5f6fdc26d469ca5276 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:00210461940f5e4b72d3074f907c43481ecc190556fccf358d1dd36f25895122 -size 89305581 +oid sha256:02321ef48ba2ffe5d27345a2322b38998fafa75641c062e4e77c8bcea68368df +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt index 93efa02b49fb034672bc7b4edb6500aac6093029..78d0790b8675133c61d1cc56dabe8e27c95e0ff5 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:425ecb2b8993f16e4653f8877bee23b6a917b2a453f1933cad1f6a7024a2162d -size 89305645 +oid sha256:bf8a58885da06b80c2beeb7e46f7154315eda833f0bdbddf5d0f7f962b9c4f49 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt index 6299c3e92be1814d15c240fe8aa4a453075e729c..00e54cc0fd48813cce5b95214920531ec0f2368f 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e9f39cf4958082e8deef13add6914ca67e399572a5a0bf04366843b5d8032a73 -size 89305645 +oid sha256:4c320eb9166625d644ff642df4ecd88ae20570a65a55970ddbd2bf90f86cfa6a +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt index 8dd6ced57b2b47535824aa36d3a9eb250ab36286..122b1ccf04a4b55ccc2b1383bc207d59974800b1 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:086955551bf20a1304a9c9d20ce3b995bf3650643b555a419a1fff6453bf3076 -size 89305773 +oid sha256:e59da7973f335a864d699defcfb5187befa553fa004b3589038f29f4a60bb9e6 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt index 0b1867361e13d5bb89bacc22ac97b72e869ae15e..61d6f8090d70cd9e7a8f79fe413790773c363a33 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c5a2423898d41be51e5dea433edebe929055154ab326171c783b6458f3329bac -size 89305581 +oid sha256:7261e232175dbf3eedeec6c33eb212d28cee1a16a7d8ee7c122e297893877fe8 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt index b0e67d4c5f243ba94551cea763a69bf60b008806..4475a352db475f99eb5422c73a0bfd1f7960d31b 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:48a3e5581ed975bffd39297951e54855869bdc011870df67eb526cb511accfb0 -size 89305709 +oid sha256:f37884cd8a61f623ea50f68194fb73f3fd1c12471d3c82fac235a9e21698fe54 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt index 1c71af5b4bd810b6a07e2da9f75ec44e61e3ba63..6ccc283bfd27fc95e37ef7c56e6a33c3921fc6af 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:02852e83868c70f30800dea0349dbe97bfd87672eb9b43b804342cca1e38f276 -size 89305645 +oid sha256:e9ea910292d70551aa3832b9782937f59e90bb6b868df6b81c6e6564a5b6b4ca +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt index ea04009a009657bc14ed6d71dceb0a659fe915cd..b9a39fde2d4825e5cc3ee8151e3f86dc325d6744 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9e83a8f3ed12593ae3fdcb12a6d4e493610ee371d432d06fa3ad4d9c67c6e5a5 -size 89305634 +oid sha256:6524d0cc4c4fdec0b147ea24e91eae9267ec3d93746bb297b725481317d03756 +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt index aa2b3f4153810fd1a39e1ee6eefa8cb211b8b3f2..d58dd5fbe6a6f815bcca98db417e0a6ab5bb8573 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fc620b4fc19c85a365f482708c3bb5215be7f6eceee37fd75a74c51f56c4dfcf -size 89305709 +oid sha256:c20427c6f6fce3ee389cca34ed316f1fc0176ece849c639ddb92c6efc35cd730 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt index 914c0731678a99d7879acd73426476550ec461a9..6853ea3092b5ce261ab880e8536fc36518bb4d62 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:969bacc14456b8d6a08f415375f54f07b9f7e157df5435bfd96ded5a344beae0 -size 89305709 +oid sha256:e12e46b8566933b387300aaea50ca233b9a5f897ed2c2042104d9c5bcb1b1578 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt index 8b4ee3234afd6849148ecdc7928d59072a49f7f1..f872f3c8aac1147021ca7234671e264928be2b33 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:61bceca2c797fe205fb12f5deb639f5bf3f2bb8cf70a2d715410e8048401c0a0 -size 89305581 +oid sha256:4e36c16f53707f18d23baf3d4fb42f3ede670a1a4c426caeb5c918de6149f0b8 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt index 166bed7fc1045127b037a12e69c17d0a62a43a61..ef389a26ebd3e3f61650c23060050132da42e64d 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f7c154ef803a63274b7cb8d5a2fee9743013776fa4090d89c4bbf418af104afd -size 89305709 +oid sha256:e56bedda086a061331b95d817e73396f2cdbc0d1e1a09ca321fd7361bf2d236e +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt index fc0cf2faf98df6c4ee87e27e30536b515b1d7e4b..f83a6a9b6fa709b533a528d6b9a736d33a84ee96 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b7727fb351a5dc48558ef9d92bbe4160f81b2caa5053e377ed5412e3f21b4883 -size 89305709 +oid sha256:0f18bb8dc7c3a7c56319c4176c4e815bd017a4418629e2f9f9a2388d489d978e +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt index 6e56fe4742f442face7302710889fce4fdf9992d..e32ad129dc4a7cadff67dbf48afccb323323c350 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9e0571011c16af6c33cdcaf7c93796451a5bc2e7c6f9a9af5b3c3708e0eb8cbb -size 89305709 +oid sha256:3709b788f158a33c92c70864738c7de61ab811e656aa577559577f000e63bc38 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt index c6a360ed7cf3459e6b10e73cd5e8afd5cf80dcb6..604bcc7c3d88205622d485e5662d73b3a7d7fcb7 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:123df0e5d75ade9b2493e63192cb2eae592d5f7d7fd03a8da96bb4aa0bec0222 -size 89305581 +oid sha256:cdc5ce9cd57be8c8a8932c174e93426ee89d7098584c35b8b8e166aa971b32a0 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt index 8eee97c7db895d0c8a7c7d8734e67c658464f095..678042310551383ee2fec7b18169e9e7a74d968e 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:88b0e57f62a0a27d0976868abb681b5834afb5e4dd6098f04aa9cd2cb045fcd4 -size 89305645 +oid sha256:1df0d0d909b6be8af47db71ae7be92d7cb2e4b1aaee00d2545b470fb16ede879 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt index 8442b300f13707ed3b463b6871d2c4db0a69f0e3..f1d4c8b51def25fa08055c966a7a3ac8de71106a 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0b632ee036aef9b46e1fb348857143c901d8d14be7f1b472c1084c43cdec8c12 -size 89305709 +oid sha256:9ab5cdf126eb938e6a27dd61e3c50f4d4b5767ada1cedf1764ebf557f492de1a +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt index 4230a29bb3ea65c534b81865521f7b6d7ec91bab..494fe08f679f2baf77bb0901cde94d3c1053eca7 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d967d36fcf8209a8c118d50056a164a770734028d4e6ceed7be25a0267398340 -size 89305645 +oid sha256:2597d3dea3e0466e7a302b632722dc985fb1e2b9eab7fbf9a36d7b13085381ac +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt index 42bc7196973a941e92599fc992ddc70ad9a77db5..7ce6e3f8ab6226b65f2aa12a91482dfb2f38c313 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9a85e5f588c55b53dad25f4f495c5ec416df445378d3b73382cf876d52db4524 -size 89305570 +oid sha256:4fa86645a0f1e623e0375b1e00c0858146e23236b1d1ab7f37d73a0e69d655e7 +size 102174114 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt index 678db34085abfc6f3c87768f2a75e0fda4c36ad3..deb3e4476d237240d53eede76c4cc3fa1c27697b 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ebda9f7f3d62bcbd9bda11b1ab0c4b979f824f4b1349b8ef284bd708b683c618 -size 89305709 +oid sha256:a1f8406cd6634b9dced8cde1804aa24fd50fbf91c9a965f3e44a449abd42ed72 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt index 20cfb973598d1fd0ad53ddbdb6d1c73124ad215c..45f4252c11a3a08ae18e3324238c718e5bb89ce9 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ebcb9a886e0a93f68da3cdf7143ae61b1d79f88f94b5dbde29b32d4bbfab2f52 -size 89305581 +oid sha256:c868e3497214c6047096b898fd445fe7e816d64171a5e2cb55d0bbc7f75fdf1e +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt index 5c0e97c4c3da985f6578f8b38559c44c8ec342d1..3060453e8c8f2f91d1925fa0ac9a606bfd9dc1f1 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ec0297bd6d5ef3288cf19d36ef55c75139fe037d7fd95053d0c189c9c7006113 -size 89305709 +oid sha256:561eefd890a0c4741d0b24b126651f4d31db1f4e516e4fa3ebb5b103a0b3e171 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt index 6f8c647b9332b1cb6ce172fa58ff102f30ed9fed..4fb098b1434b6b2a64e3ac39d0f92b10f2bcf0af 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ea89615de8f4c23e9f515874229858efc4b69fe9102533b3d1851bb72bac172e -size 89305645 +oid sha256:da9ceff52ddd76d7333e459df0e912cf22f24dd67a1927c6c479b05793519b00 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt index d77c179ac49117d6367381f378751ce5799277b8..6ee91acc71803bd861fa76d2256664c4b5fc2681 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ca70b60c8e41f91eb4a7193ea39100979d12b3a0b1583eb37b7aa19ac953d76e -size 89305645 +oid sha256:08cd6c6e758228d9358c24a911d8b3e70c33f40c3661ca51faf968dc9e7200f5 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt index 2464d02e4d8e1ab2dec3ae5bba6308171c77f7f4..00df95cc48371a92c1cecfbf5604d5ca134ce4e5 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fdffe3fb904e168302a5b2d7e2b2fe3661cbc8af01cb7100417e6255d0ec780a -size 89305645 +oid sha256:e7e4e2c34f73d6d0bc0592c41b9dd2a6305f9e06fbccc2fabed34add47fa0fdc +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt index 4d2df913b62d74d32278f285a77059a1ecd54d1e..440ca9d8dca185d2bbe51419c95e326829ffe08e 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cd481428794598785383023aafd9088aec7b1644c833049b98693186f9f80ac6 -size 89305709 +oid sha256:befc7f44b7fcc56924d9d8183428eb11f51324920304af89b3492ec2109a9cbd +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt index 1b4fc9789c9536aa5f99fef0a8f4d6e8b96324e2..9f7f5df692a901f9e6ea12bc70aca2ea95e25679 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e0a7abb7c51f7cfce42b1929340afefc37cbdc0ba35b1755e2e8eda2641c9b44 -size 89305709 +oid sha256:75c1b704959b67b4ab05aa7f45d3425acbf2e9a01d773c92c3a721de973b6b72 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt index a60f498fd5370f950f8d64804bf703f5222dbfc9..ebb6b98c330d8390912924b412d13b3dbd62dc83 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6cb536b1e61aed279b9f623da917f87441d083ce4659b78641de005b225ebedd -size 89305709 +oid sha256:31defe5c2b515ee619cf01439efab1d02122bd856115a17a75af9c67f0d17dbb +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt index 1a54787ae499cae3e179810e0501b911c24940a8..64cf88b378d49abebf3c32d221772df3496421a8 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b314453187fbec8534a968b704fd77684b1adcc76ce300e1272fedf2213ad1bc -size 89305645 +oid sha256:aabbc8f3b6e308c73bdd2498d066153174d7c595d424c12ec4963dd73ef177db +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt index e5bddc0f1e7c0e16a20b8ac928e63e3432db793d..585485b3d903f2202a09f58219baa052110f2c69 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:63e1a0908247d838e401e726587eed26c7a87a066c3492c5b2b25dc470a59c52 -size 89305570 +oid sha256:d55c3796d1eb6f80600622c4f79ff170257d9ce53f362bd7b579d4b4a48df3bf +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt index d712a2637ba038d5b211d2598b7fa622e133f8e0..67f14fe4c83807e0e7ee93162093d6f51f64c11a 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3c28d2fb9eaedcd55736085f309c05fae67ae2d5e23f504ac825a8d29e313c9 -size 89305581 +oid sha256:8a0e8613fc36491553dda0ec8323b2fc04fe9251cb6c974828a593f332c9b8f9 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt index 4f962118a8c0feebe95dcd340ff38242f7921be3..d4b39e49ff636d40665c6b2f3d3fc9e4aa9b0286 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bf92712c8225c8a88e00dc5c603bc2799994910a36db00de56008071b80266ae -size 89305645 +oid sha256:fc1fcf0176f8b8ab73f0b502cbb1dd82621a311b11f7e9f4470d0308ebcaa824 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt index 0e9924a87f859f47431d01cca391417b62196436..29ea56b90cdf52b19f1c8a37b36cbc7cc9029fd9 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:eaa4aafcab3a9c201a4c35bca28a40f6333d894f0f7c452ff7831adb73c360e1 -size 89305709 +oid sha256:2ca1b70d37ab68befd00845f60d36616a3e3605cfc27d484c7db2e90ce866c47 +size 102174189 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt index c79727f1afc3fb6d2dea903167e2d94ccbdf492f..e9d10ac539804a5d4409ed800d83a091ae3a4fd1 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bf50c8d56656e0fcc1a129f5b0c48ebefacfa4e58c362376584cdebebef16e59 -size 89305645 +oid sha256:0574f57c1a5951e1a3560f992bf848d35c7d8d5da6f15dec111634c90d04f917 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt index 5d85986a33f39e03c8ec8086005ecc6a623ad94d..f8ef692f99dfc60219397b8ae9d6cfac90de58b2 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5478456746eb86c84199e2a126b3f3aafc5ca1fcc43a763b114c1066f038ff26 -size 89305645 +oid sha256:25066d0438581d0bf03bf80b5f05ef6ff3a70842d6128e86b3eee1eafe00b95e +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt index 30d1632dd3ab26149477fb7baabccd506d867b05..c989bf7fd620844ea2e0ebe6ad3c231e578366fa 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e9c76035a7eb2e96a6ee130a84784f2c288dbce93a7dcbec20f7a8e50b1fdb3e -size 89305581 +oid sha256:5048254012f5547faa2c11840cd10195c76988514891c6cca9f40d6f3581f240 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt index 54eaa9733905f46e1a308f667870d105acd461f4..3edcd13c227801a4ea9a4f4c371d46299e9c6acc 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c1f1ede5d2ef283b6c222f187db342a478f1a4edbe168c3e91ff4c2b50995554 -size 89305709 +oid sha256:5d97c86096df03cb8a13ce9e1b035cf54c4bfce45899ececeddd33109f1de980 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt index 594a86a41cf7af10c90df6836cb4c407f7e0aa9a..235424d77f8e56a973ee0bcbad46e80a288af96a 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:90e2fcf8e0278649adbeb87ef9556847951335668e6c3bf9d3df6d53a22cda14 -size 89305645 +oid sha256:5a21816f6f68ca56bc3716e3b68e0c674b8cb4fbcd6eeada493caa8982d35888 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt index e831cbe762ecb14fa6fdb2cacb9566cf6fd6178f..354858a552cb1c0f195d59970ff1382ba56ebb15 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b42ac1028d120cf2637c1099f7c62fa9bc623650738b82c17460fe4c9e9f8781 -size 89305709 +oid sha256:d4c5c7ebf0e5da8bd70830c53340075373eab91edbd155eeaff94b0c7d9a686c +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt index b2a1af550789f85b320f8b3c5f79e0bc05dd59f0..7fc456fe2f28ec03eca04e03c76088fe71d24cdc 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:156639ab2cce89695cd83152ed31cefa2f1fc3fc71798518dac9326fbdb0546e -size 89305645 +oid sha256:a3fe99f7eacc7c0f2e8a0f190100e60bc8417708545fe461b5e31a82bf238e36 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt index 27237ad13b93c77f09c1e6920ef7d5d6133bcdd0..4c536794ea0ab2f77b455ff41891232137827c73 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:aec045822f04f8b6f0915c7e2aa1e120304e0961ac2da41e20709777e56b4cab -size 89305698 +oid sha256:2f532863d647e0d413fe87252f64a3027169aaed91578bf14859d98643b01c2f +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt index ccb1150cd881e739caab23880a28c6eda4168cca..d6481dd0661c86fbd279eaa4f8ce120ae76fef71 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0d084ce025796954ccba580b4aa4e46518b8f82a64c442909e985730a933cb3c -size 89305581 +oid sha256:4499efb32297ea7ec6bf5bcdc6fccc4cf91f7d527787d12497ab1bf1e50765ed +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt index 1d0071aecbfc42a81671f9f7c0c5a073a1bdd18f..fc901c3ccd0a8034630d72d28997fc239bbe5c76 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ab6c6fba288418c0228da077b9a34291ac5d815c5f7a98b23f4c4e59b0203931 -size 89305709 +oid sha256:4fbb8c9bbd143f2e6c667298bbe63334ea731e92c1c2dd0342b2788bd8fb6b14 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt index a9365be9dce57a5a18c4b0a533a3c91f24e19b9f..15f060fc7fcc53e8dd383f3d3531f3b866d57aaf 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5835cd562380a52db40a1e48c432b0937b94c1079343719bb94fca4f7d5340b1 -size 89305645 +oid sha256:4d9fbf133bee32e02d4f7c9cdae387d9ca005de71264e3f6aaa018233d18901e +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt index ca77c4de8e1fe1cdc6557019ab4b6ee277e4087a..a2460942ecc38a759de9a9dd002d27ab19a6fdeb 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d0b8acd7a697590ef333985d69575bbb60913fa5bfd8dc269e8ec9ee1a9a7e86 -size 89305709 +oid sha256:f9ef7dbe1e7c018a0c72eb8d796bb4ee6b41b222f9ce46afeec927d905aa02a2 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt index b5067c4404ee3027f9181d0907f22c2a5f2e0a9f..6664058882f49e509fca2bf7d4cc659f40ad71c6 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:22e5912850d8574db35214697ba33fbe12308559a3d4cecafbdbe5c316feada3 -size 89305709 +oid sha256:1a615784672a7f23358fc55a7e46b0c7dfd1e7ebd9521990338f3af491eeacf2 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt index 03973bc2ea001872bc8740d9424e6ee05472d985..a034b7b8649db1eec8455854e8f2c484efb6ae73 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:12eacca0c3f1a80970cfe5fef5884afb804d281f67fed622a3b1b557d3937a80 -size 89305645 +oid sha256:ecbb888a6207e34994f6d86f0d88460883111d2d5a11e429f23448b4b1960402 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt index c8870a6926ad2983519990d4f33e3957b6c27332..3b39e652f1c88835ed1263d35189574d6cab65c2 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ed047356663dae12b9ba8c3a09d83c9713efe32359afb804b4485fc49488160f -size 89305709 +oid sha256:477029271bacdda0dad191ef1f26ce46c8747aaa82f0f3bf0fceb8562e979f19 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt index 3d15f8294aa4f115fb4b6f83d4c3420263c82841..dae138db4a299be73a2c8b08e74b2117ce234e1e 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cc515ec59a936a154c59744792fee9d7a1bd72394d01c4d4c53c58aead79ee66 -size 89305645 +oid sha256:6e95c04cc8240b367ba86c75f3d3ca141428aec74bd90207dcc83a3a7eea3cbd +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt index bcf814e51ff72839fdaf2bb1a5668faa2ba98deb..806dc2c2ea340310f06d13f9c8947eff4762f93e 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cf9db091269c0764981e496f2c059efc0aecdb5b1dc4236ab11b615664cd26d6 -size 89305581 +oid sha256:abe57923c0f8851b69c80799584451520b6dc0313b29f0cc64d7f662120a3455 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt index 43c5c3e6063ff024ea4aa5d3597d9336ab72b51e..e7fc32f949446114e45a673eb0a142f5999c93d7 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:72d6b1cd0e02ca393d023c81d07a451739a22f49080bbeb3e83f617b7c49b698 -size 89305645 +oid sha256:f8904fdffd8a48ddc737c6af40c88521e37cde9cbc0f6002b6642a977dbf4063 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt index ceb6549da6e443f4c871d296abd8fc6402d9d17a..4fcac6dcb9aa8c15972f1be2983e48f8372881fc 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f086a5039c9be02e6b3a904e958ade7df2c417c3763ba9a7bff015f404d51812 -size 89305634 +oid sha256:72e9e320c4c3def2d7a346f3fdedb8016a9152c0c13544428e85be7ab3beaf8a +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt index 4e44be0727760c8fa0aca7332ce0f12931eeec27..fd5010846256520a9d3645c6467469fee90d03ee 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9033f6c8f530a742ba94bf7dab46c1dcb01572c9ca74071ab1fa1c5c934d910b -size 89305773 +oid sha256:45dc12c1822db6a1814d8e7144ed94112b088ca5a15953c28d77c3994b824fd3 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt index eceb7e21309faa1c1764443746ec6688a835f766..e0980216218d7ee694f0a4f15024afe241946dd1 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1cd0b96af52d1847a2fd6b5b76c1d811ce3064834ee2ebe7c9cd568a5d079ef4 -size 89305581 +oid sha256:fd2928496dff2d83843f641bd05d237b5a35055f062de88aeb801aa697614c3b +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt index e6ab38693feedcc15996f90b674a7d7faaecc4c5..b09b738b679b2823de1ee416426dc0d77ad38fea 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:894f0856d5b9ec726feab49c4021b98e85ee1dd4f29709f40fc71858ebc6e3f9 -size 89305645 +oid sha256:7bc48e154018db4ca6bc4d064cbdd9158338b93232e50299a9ed480592009209 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt index 76c5f31b0a3be04294d9c50d35c98078bbf298f8..a4294219d741189a77235b8f3f99ad79c59d493b 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:87c98898279867fab21c6bf28f9ae091b97dc849dff042197329565d3525fadc -size 89305581 +oid sha256:0eea92292c719a8cb42156da094218fd1e8766a334df5678ed3a61c59e3d3ca1 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt index 462cc4563a2dc008ebc3039c86a561563a51c529..49d3034fe74eda1a629c366d3fcfd3db57caa482 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:64119acf51cc336c277d05c0e1f4346b350ee650daa3c86413d09e1c80343466 -size 89305645 +oid sha256:f0979cde69c4a5a8b06cf305b67b04e8fc3047fdf3202672ae86eb8344afedaf +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt index d28c8f0ee1d05d4df6fb76697134b96dcfa8dac9..eab741a29ce42eadb415014487d9cd02bd012b98 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4fdaee2bc2b06d64c41ee2a4c2a1f34a3ac4a86087a4beb6eda581cea9b26db4 -size 89305773 +oid sha256:8e9f8bffe32f923f3563c60b2b4af86c0e64548c4275eb873ee364927cdb2caf +size 102174189 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt index 1452d114b53a75e3681c267a970a0d7f58746bfc..25fd4ab738bf9da49d8438491fe0e4ef103c3a96 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c02bda7c5ff1de054ad23d01b058ebbff169d64bfe5577c77fae123e0fa67846 -size 89305709 +oid sha256:68439d169a2396f4863ae9c4248eaf05da886e117c06db7a2466ccb3f18479b6 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt index 1f54c690118df353c985820c75f4fa77bd37092a..4969aa1210cf037abd3f500f10e08ae9fee9c6d2 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a42bfe46aab3f7ab92b58065f42ee9a54e2f4fbf722deb515e7a1f73e9213887 -size 89305581 +oid sha256:ab261cc6ad987e2cd26379cc8bfac988c497b3147689a48f6154ca0a8085b3aa +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt index 7bd9f20e28ab0fe3f44e1d16f0b5e88052d8843c..95ae3304265c01e327d8551593a17b3f72f91246 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:61295a7d0c0d7c441440d2fcd4426976750db7a20c75b8a90c32f0cf76b04512 -size 89305581 +oid sha256:b9cb4c93374f3952fcb293c2488a7f0ec1166f0fcaa7d26472cb7843a6a35175 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt index 17c870e3e8f854d343c73d0bb9a7008d7bfdf92c..df3d3a1a0e34e2d92accd101801e040d9fb51265 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b2bcff9ca4f5ec25b0ad3cfa4a4f669f8fd2cf3228d4c936e5b090507c4d257e -size 89305709 +oid sha256:89b28026b07e3d3048c1e6875bd683a345f0bab3400dac225f4e57ffbcdcfd8c +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt index b82bd9ae68be62a6f20b4caefbad8851218aba68..1eef19c2dffb59770a604343969b63234ccaf0ee 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:823774d6930edb9488f0dc83788a0e50d5b40b804d7187a87d9d3daaebae0cca -size 89305634 +oid sha256:9148e67081298de1a5981c6656381875e814c1597c8c628c807cdcd9203c6bdf +size 102174114 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt index 2a739d6b36084dcecd9beff732fbaaaaaa2cf0f4..5f513eab5895a5721c55da2a618aabdd2229649f 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:826eaca6e317e00aa7f53338331b59b1c1d24e041212d86a2e6aac37467ac385 -size 89305623 +oid sha256:a8586a4dd22c03e43c12670578932a9cb40f07c0a523d10c87467e2633fd3716 +size 102174039 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt index d903722ee2d347ad4ecc5a8fec6cb4b90f7a5406..b36a05dcf61e1a0a1f11faed3b86e2e5625ecc1e 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:185e91cbc530d0bbdd34c69485259dc834c68e627d5c4ed184f766593c067690 -size 89305645 +oid sha256:fdad0179597fb079be3c79f4307085663aa49f6a7b4ae1864d52e4b8ba1e9727 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt index cee37576dea80131409efeab1b61c7cda199f1c6..a01d67728a538ac94a7eb17e6309c6e29cba1bc4 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3efff9c8e7dc59a3e4d5f49f9a81eb3785dac2971b8a40f2bcd48c66f7fc010e -size 89305709 +oid sha256:987f2b2991c23999c8a87df4d9f8f37a27f03c10ddc00bcc5c9b85494dfcff0e +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt index 2b9391d090c213c62d4f558daa5e9a1a359e9aa3..0113d15e661214ecbdaf59583e53fe63cb429fff 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dcce157e8170119c02b6378d789ffdc1fc6acbad55c0bb491aad4d4b09099635 -size 89305645 +oid sha256:280cc142011be0d8b445298526cad9b5a51b347cac6b35bceba1c43e3cda4767 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt index 5b8f2a9ddd48094db5fc0ec7f319277e1048ff8b..8fc73e516283543551aca83db9f1b1fad5dd0149 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2169642a586b0c5c02ff0028a8654c22cb2c60051ca2841ef096a0b97aedb52e -size 89305645 +oid sha256:dc08a99cb24e7cbb4d0d88d3f784aa56eb0ba1e2da18c19a32d91db8a27c6956 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt index 287b6982d17decc4c1316ebd03c20efd5e34fe5a..ceb1113afc74f29aa2b6ccd8e0fd5c252ccc6363 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:06b8a6abb14df9c2cf1d8d67885a389d628bb592159c77487760945a3203a74a -size 89305709 +oid sha256:d17fc57e88bebf997b8afc932df7955b8e6ee317fb8749d91dd3e7ab9219a75c +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt index fee7c95986f8f6fc942c7613a73bf19c4c8ca029..d458032ff0c0b60f2fb43c988960cbfceb89b388 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9bbf9ebdbd1b9a989ee5e5fa5482fe5bb3646cbc5c2be2d29a0390b727c7c800 -size 89305645 +oid sha256:7ce5b13417b253cada971d757d5e685a64537657942cf16f74fa4e017dfe1e97 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt index 8a2966ae8f7a5f2b3a9fece49e630f988ff7114b..aba3a0551b19e15c7b761c9d97a65331127a1464 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d598800e8777ec03a6f99877a2ad6b5b9bc6fe9155d3731e6659c102b6736129 -size 89305709 +oid sha256:1829fee9e91e12bd96477f22371c8753295b5afdf806d20476f21b24bd859438 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt index 68ec163f5cdcf45e0f02daa7713a613385f03e3a..58bc6d614f0ce3a597314d169e496cd1bc2b9c7b 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:34a330d467a7e59411736b13df2b0f922399803496fad4e95d89938449f29ce7 -size 89305581 +oid sha256:736e2a78f862310430f05767c4a77b1f998d1714965491df39e396c0feb8ca38 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt index 9e541c6abff04ccb5efa3dd44584f3d58aaea3f8..0b229c43a25d07a4b1cdb1c257568570d50fb8a6 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0151397f1fc3deb72953c387f0afe2103f796c88014e4fcd2d02666a31f82021 -size 89305709 +oid sha256:3d115a28d759138f1972e9ff76c4b8e5c3a02855dccee49bea96b2681c234669 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt index 9d860477dac36f9925006eaaf321a20342f2933c..181e02fea143d81328886a8c8afac5aa7b0f48ba 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7578380259026f85bcbff78f108558823a5e13c97f36fb5868d41677eeccddfb -size 89305645 +oid sha256:8841b1c08099307d396378495bcf4174e6778b77781092966b0c6cf34801f72f +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt index 5d2cac2803a9f408a79a65e561defc9b11cc61d7..fd5963677b7e8814602b5532a199014fb8a0f45d 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5013f347e1a90ac2fadd4cd3ae89adb88b04459cd35a751ae904f1986ce434d6 -size 89305570 +oid sha256:605af5e677bf792961ad890f087c00d59313f1e7ea5a636884e00086d294d8d7 +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt index 4f45b30be27aaf67519b14c95d0e411efd124df3..30a66c0727c1da779487ba6ae9c7c1cfc7860d1c 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7ddcb619a47b4a3269366d3f48b4175c1ea71f4bc7d1b41c1de59c42ceb0c22b -size 89305645 +oid sha256:dbbfed5c777baf786500d06f9c63481594a3b2da87790b8bdedddda72170d8ae +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt index 371dcaee57c8a33e247c37c78ef98163fb7c703c..af92b646fe6f3dd4d0853019d83d46dfaeef213a 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fbedcc3de69dfa686a1d8c22ba47e29c6c3d1403ba250b56ffba522079fb21f8 -size 89305581 +oid sha256:5bce7024bfb7e834fef12358f84c4872738bf5825994f1881529ee48d8d330ac +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt index bd5019d4dbbd643e0d3fa1db63c974d266efff32..b9d35c7a521377b1fd37e41a1243581114d7fd4d 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2127297aa0d7e937c7d52bd06c323a62a0dcc44dba3d79675099081c53404cec -size 89305709 +oid sha256:bb11b148fe7281fbf16ead3beda70ee4d54bacb4eac50b8712f554dd4db7579a +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt index 1eaf37149b85e28b21f4c83e47723cbdbe6dc9a7..f0119258eadfd5dff78389a36d467e946dff335b 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b8ea9df5349e793ac2b07c76aae0f8871a95caa1690d1da79f5cf97c88186d25 -size 89305645 +oid sha256:8080fdfc3ef4d017f518f44c70a7c23b32bdab2547794e06551fd1989b1e96f8 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt index adf5dce132ae467174a55e8242d766c374b2abe2..e8242e2e2259aab13709ff1e59782ad6f7adc7f4 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e4104999f381a1683141bb138db95b72e2f4a61006f4b820d0e09222000d95a6 -size 89305773 +oid sha256:322130e46a583ef8fccd15d1366862e2a817e5b1b161bf9ced06f066a5b16108 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt index 006612cfc0aa6cce61f765a12c4b14307afc8612..d3ace79794c6b2e2ad9f7de17656c36fd6913503 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4a66cc1059726b8ab6efd167c9bcbbf2c0caa392b85c8c5ab80bf434f587fbb0 -size 89305581 +oid sha256:889278aa1b70878e8dbeb8e7706dbd9e5ea31f95c213fd2e3fbe4f5eda53fb0e +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt index 16c1bdc6819f4951797a8bb1fce41b99f461057f..29d7fed2ec6b0dd401b411a288f8406c4ba9c35d 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5e363f1ab061a145400ba18802e45596198df5f14038a068a4c04565991c389b -size 89305645 +oid sha256:4c8503e924a38b30fa1afc0435a38ac037f4d518de2968c0b57868da654cad07 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt index faaa5cb32fc0a5448836f8285b6300a5d0194a73..c8de2cbf9c8ff03b375916bde4067419fb6bb75b 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c9c78541a0cef9b65e773a3508db03b534d413c168cb957eae45e6c7d4ba7594 -size 89305709 +oid sha256:3ca98e595cb33e0bae9888bb32b5aa40032d0d3c51be65381a97c359bea34f46 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt index ebd4aeaf005f9cd487d1242be880704c076731e3..5964d1ad0e846212d07f1845fa462f8d30e9d92c 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:58d5f433f96c86155855fc64e810fdf3da68cdcc4b8e9e7f39b3f3440af3aef5 -size 89305645 +oid sha256:63638c55e1b55130dae9c7427c43156b53ca96ea5d056d9256b08c1e6ee6582e +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt index 1c2742adc5db3888013caeec1b0bc0aa133ef178..9b096da58bf7cc0bf8990b039af45fd19e3c90ab 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2f93319f6755575fd597d6e4be6a308916ae5ff77fc55eece6b38f9a33a362b3 -size 89305645 +oid sha256:acb45da735b8f185a7328088b072231ff188dc9c5ab115783863dffbf29e03f1 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt index ed09742d212e216667360c71978ec1cd573ecfa0..2df783214abffe50f74cce1b88c5a559caf3f331 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:24d9bc52eb722b67a5c3c2b69598899f442465e622609255d3caf10da1b52e8f -size 89305634 +oid sha256:da06ec0447d807da49918e61151f5fbdbde660d72b7d2f5d8c6d9e366523ea8f +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt index 2e22fc91d0e76197f721e0ad796a74ba1f558532..4ac4006061901082aec065bee607ff6e21c702b0 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:54178d1c98b64e7467d956a5135d7f818a9c16859be9388b03dbc5492b908637 -size 89305645 +oid sha256:61437c58f354cdb090e8b7a97c2c519ab484e86c525fb055e9aafa4e2fd346da +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt index a6e8a0a7586fbc353558a48bf8630d01e9485c5f..1cb682233d1a31107db8b45a74ff0d0eeabc6528 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:28ea04e496915a11b4c9fe637b04d57bc801394c2e990761f3131dc2b3204cc1 -size 89305645 +oid sha256:1921ab535b9e219bd14de981354f0e0057614919f4605f47d4625f9f08b3f49a +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt index c62af4d7279bb0be77240c8a902b5c8096cd2c8e..2e6ece3f3ae100ec8c095d691210250ad08303fa 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9a10ac39fc3e171a3f7f35cb72501a86f814a41dd38627f0c9b8295bc03aa18a -size 89305645 +oid sha256:0097ab9f87a2b38cd108a2cc4ff6430dcd8b0bb481005b39c66d113683026b0c +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt index 2723c6d4856fa1cd92681a3a99c89ca2a776c07a..e3d14e9862bbf3cdbe8831080211a09ac47f5e63 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:19bb59cd2ae814a76b89162fba2b840af5e73b3df2d1170e7831adb8e3d4ffb6 -size 89305773 +oid sha256:64b5a270b5a661861ff1d562d0a4814c69aea8d1a87f41e97eae36f8ed781943 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt index 96d28b18af4ca53fb5c91bc222b7b17aa7c1b3e0..8fb8fdf03c421c65dcbb21a7f0e56bef01baf3fd 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a1ea0ae20a0aa871f44ebccf17817ba7e4356656e0f4a1108d72e6e253a5b1d2 -size 89305645 +oid sha256:8eed3479c8a6affacfa20d5a663b6dd2fcc2173b4be97590a7bc2c0f8f96c2d7 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt index e46da196869686e952ca88a5f62b967d8d268aa0..fdb7a4494deeb31ecf72f120fee384bdc30448b2 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:071a9e751ac64da34d21586e26344a53fe871e3809e5884594dbe421f9d9bf6d -size 89305581 +oid sha256:fe885d5ba4a92d7d310dee1c326b46e98e5129671ae3ae94a1a6c7aedd172554 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt index f0a57ceb61ffe77b58fee09dcd98f80442943f5f..12a1a1c06d33feb322bbb6c8f916b57a92f5645a 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6b745033745e6866d8e7cb7cbbe63b632b7390b72168d437a78a6b2c2b6d9fd6 -size 89305709 +oid sha256:e38cdded07c365e24cb4317fcd56f19454a78e5ac5a2618af49cc64f64b68b9b +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt index d6d0486c202ae6455dfed871debd722bbe2b1e08..6851e5bf0c8964f3c169a6b5f7a48e699af53dcf 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e0c94452bfb32d9086bf2a551c79198bc968bfb47607cfe9babda543dcd50db0 -size 89305645 +oid sha256:9008a401a898e5f82a705a41758fdddce2aa32d3198813bbdcb8fddbcdd973d3 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt index bcd834c890e8bccd080dc67b61a518a2a0b672bc..12d2723fd2335114d760ce5bf78c1012f920ab94 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ae04e04dbdca696bef3664e7cb5aea475dd63cf7fec4cf6b196ebe3490df7e70 -size 89305773 +oid sha256:67c7c69cc98d20ae664ea4180bd5a1e7c12e53d0ddd88be926c57c1488bffeb7 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt index 78e35aeeaf7b2f0b24cb24f3b2459713af6d95d5..050e1f684d3ebf180634391bff53c1e9e9bc912a 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dfde63d20e06a4c28a6da4aa2b4499e40f3a9c9b064764e69cb7fb0f9349a69e -size 89305581 +oid sha256:50f2b8595493a54bb838b52ef8c303fc37435b49d68fba5413a6a63d6671aa2a +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt index 1156df6e8ee557616e9d96d2a8b11878f8bb30f9..dab8a6324fbd4da1dbecad1b80f926ca484c2a15 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1866a4eb40dd3f1f9eb99d321b4d9880e99d77bb05f1a2da8d0965fa3b3b42d4 -size 89305634 +oid sha256:1d9b04ac23a2d8a04fbabddd5112e20f1c3f5ed94d18443bf9a9803cdbc15047 +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt index 8e37639e384aa8e0f3018937ad41ed2c6c4d019a..0c545bae221be642cea04f741e8510a503e7d85a 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5389d9305e968655cbd119476a12fe087df0586cdb84bf1c06b0492f7da83bf8 -size 89305645 +oid sha256:a2192fd05ed8d9f0805bac0af5dd78267646f5356ae926526738e394eed81216 +size 102174189 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt index 744270b00f83cf4b9d27586ce62379003ed7d690..e3e6b9f008bace655ab192a28859371a4fa1af01 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e957f97951e04df9b1cc9b0d090182a4340ebd2e153118a027ad4d9c8d25c76c -size 89305645 +oid sha256:c9cd98a66845a33f74a91b08414dbc0afa8cca7623aebb0188ebbbcbefd32062 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt index a0faaefd82ebd659469ea6543ada923949694846..c4bc48d2ce99cfb5dfd82cef26b6e9b3b5da2f89 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2485f210b3b55fc7bdd9dde10c2876d8f7953e6f25aa2d1289de4b74b9412fe5 -size 89305837 +oid sha256:ade0562fb05809cf99362988de635b240266a501f349576f7e08e7327ffd634c +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt index cb5763c08707854cee0b5d195d5ec310614428bb..c4fb519dfa49166f1bbb7e8ab9c49de1c60c875e 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cbd2793e15af4ec08c1421301b23c90a07c001126223663076c5e1af5f520b4a -size 89305581 +oid sha256:8521d8cd85e4e229940154147678b67d3da1d87f1a6604a68da7de4d4c59731f +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt index d6c818785a06ee0eed33f48246a2c6cd3f0286ec..c2a1ea4755e51b49090c93590c40a879ace20748 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f3008938a1a6445434e790f83722993ab2db91230d83938440fa7a42d5133624 -size 89305645 +oid sha256:efecc2daa712aeda04136762921bb1804a62f63f8a2e5a49c739c56d0b3881fb +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt index 9629f175f8a7e25aadcffc01848c0b823f80f4e8..263f37d34372a78a38931e4f40abcbb2cc660f34 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a1d369863020f1617472ac062e3442f7b4fc081b2309315f43a4f969b816b52c -size 89305645 +oid sha256:49bcb04939f204065b2a09eda8787699e73a717937135e55c2899dd9ece907e7 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt index 031270112d935ca9a25982d3901cd18907ce8b21..5dccfb3f00a7d2c91f7e80f76df07be70771fdaa 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:acd4c400e9de3bebb946df7c748da3d37f94302be8a8ac1b6dbfd055b50331f8 -size 89305645 +oid sha256:3c57c9b5126484c533e79f58b0c5d1463dce124cb9ce8f9e8cf87189276ec722 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt index dae61cdbdbd964e86af17a740be779622e0c44eb..508f6f43db030616d68fbe7606352db0ef1da504 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:aae547ba4b60906606af26cc5074e26c7c421dcd0884274f72c87d63ae326a46 -size 89305709 +oid sha256:c23f2e8fc230aace351a035b22e0fc807dec3b915a76024131b3c8ef11eba05b +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt index 1b96b66f9cb3627781ac218da33f9a1d2c952108..3f019713c4c98197f3a2298b8c7d7d745097e4df 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6fc5924a133ab0ac434ed64678f2f98b6be4fb2d7800c117c0ea13f1181aa5b3 -size 89305645 +oid sha256:5815df21f8b073efcddc30d935402598700c7ed13680e0b716150257205702e6 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt index f9f82c304473b5bbfe9b2d8c6481b23f6c85ee70..e2c9340817b979fa6a45c62cc5e17b0f932d4ee8 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:da846be0d66886f13dd5e49a0d969aee57e63340be3ef3771580b32130aa6b5d -size 89305709 +oid sha256:e2fbc1883b28e0a47e29c2fecb2ddf0fbd2be528fcc9c54478adc74362fe1d0d +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt index 2aa7cfdf5a36aae9f2c2e59f1df155aac0a1b744..be9965e00d8c49313ef2b9987024c95cb0030984 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a7b7fe13ffe96bdc5acb6633a22cc5fff6fb9fd5a5aac0bb7d8a56d7f053189f -size 89305762 +oid sha256:4ec0985b67ada8e0f36cc508eeca9d726370f9afff64459f786a5aa4d9caf83f +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt index 9f96caf2ccf63cfa47e08ac196d941395ff68a96..842e553935a80268c1bd96161576ea04f62333ca 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d31b4032fd752115941e9e60901603beb4b6a29b39c210198983350d4645b04e -size 89305645 +oid sha256:2c835dc9cfa772caee995c1ca0513492116c938df8aeff3a33a1836cd8d3c761 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt index 786ff62b4f4f756efe54f4b31f6478a1bf650507..7ccd26b2a0ff7dba53178864efce3cd02edd9696 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9a982435e8010dfc8613ed17c0123d2a03475dee173796e9ea69d33c5855acc1 -size 89305645 +oid sha256:70a1b12f796dd8f258e6bfef3ee927375f413e96cd645eaa87129a81df3f346a +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt index 1766599a23020a3aa14149131529afec36e9c0bc..b664e942ca95117d12d65680652cda726608885e 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e16a7919033f0d83066e41084a5f42d951d56d8dd3dd238a28cf6512baab1883 -size 89305709 +oid sha256:5319c39e968d0ae9b3b4841cbb47030da658e717859286d02075a7252242fb6d +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt index d9978c1e1b17b2138e80943088a6b0554fc9692e..d10b55ee045f60d27539366d604820cf69c80725 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0d17c35c62115c06364e8c22857abd7def1181c0dc1c3c9c6b4033e1f3e499f7 -size 89305581 +oid sha256:988cba39f014f625115438a8a2a5b3d80fc7802689353a42dccb2b12e413c7f3 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt index 580e7111a316505e5ab72bc05554a487280541c5..83b75281edb073401f6d1fc8f0604d9bfd847f12 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fdf5bad0b509c0f68efd5d19a3bf997bc104d49af8d6fdbc82d23bfcc2d2548d -size 89305709 +oid sha256:030e66668e2081a41c80fb82ae1d6b55b8cfb5a2629e84d6ce02a876c9c843b5 +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt index 68a9081a054f22a6abad3579a4f4e17076e7af89..fa84ba665a31c824a2cdbb6b744e3e4d2eb8e5ca 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a429b07486271dd632b424a5625c6b66e78d674ccc1674e4f8dd4408aeefde7f -size 89305709 +oid sha256:95369b424d08613d6e4136e96f12acca1a3b06c2efc3e30d51cff28e5238e5e6 +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt index a7677a19575d3854deec9b5415daecd0f053ba47..5652d6d8e5006414c8c8662ddfa2d67d1c2964ce 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d1382174f470e3816922303e1186d9b52c2fc96245fa3e6da759a861d05ddcb6 -size 89305709 +oid sha256:8ef969b5cd4f0bc156b331554d3f1a03c34737bcdd8d5dc9e29378ae5497d01e +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt index 7f5c1e690f7846733ac33d01217b05004c58fed0..d6b6b67392bf48a477230b9f227dfecf8c53a2f7 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:775ebf011db81ca2c457737ee4ba24f15bca58d6f31902d8d4bf7e748380f299 -size 89305581 +oid sha256:64f0c978b62ce92dc44bf599f70e9c8960d2a06fdc019b1176fa3ac3360706ee +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt index c92da775eecfa45999a031822493f4e3ffc48ed1..958ceb4ec0ce283bd78c831d5312ee406afe72e7 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5851a31e4dc32a86de8e866a89d62ec780cd04f761b319e65257a754325185ed -size 89305581 +oid sha256:da2e1071ef8e5dc105d84a365de37838e413bec527de9ab7a8e68efb7aa0c2ab +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt index aa9d210cf23160c3834dd860152a779466eadfbb..6bd52d2326054ddab5d08be389f6b1fa98495463 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:67d7f455f17e20b165caa998a756059a008dca8b78d46cd3b87a0b2fa7f1ec2f -size 89305773 +oid sha256:fd856c7b57a94f84306499c9414b17277c0ead46dcb44433921bd8502b57deaf +size 102174189 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt index 1657314b12208598830045200662fddeb6988117..96ad44d8ffa6aef01f9270b391021932c1f5a540 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:db9eaa53970019781ed3335ce62afbad5ed41b39860c5da7e9a646203b266228 -size 89305570 +oid sha256:49a1a8a4173c083fda65c8ff0a45aa722f0040f5dea8efa305d923a3d879a256 +size 102174114 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt index 50dd098fa6189b6b014e7bf9d67b99fc3573dd79..24ff13e6b6a98725b6b6a0a2fa20f9613de0c2b2 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f0704b165387d9b923c3291f40044cad0f9783a506cb2a9780922dca0e516a2d -size 89305773 +oid sha256:30cfa8624733194b4026c589be45246d81b3f690a1fb6b5b1cf62c55efbe868f +size 102174125 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt index 2978ae480450a53e83b7b15000f85fbade9a4775..00a79aa690135ab284168a57c803cb001aeb400c 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d105290b3ac5f1cdb0931c8f29e339ce8690f17f8e61cf3c35a8c2643758dd14 -size 89305645 +oid sha256:b2ca265c6431efc8a57bbbdd0d6b3124a4ccec6427b076f7dbcf49d3791d47e6 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt index dc634cffe0468643c3c564fe0c8a301bcd83771d..bf899815ee4ad49ccf21bcb9b07a8a6a347e14cd 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a7a6d52631d2b8e3ed4f8119070c4629dbeb321b60800e37b3baf2c097d27eca -size 89305581 +oid sha256:1255cb0358935e5a8c751b84cdf4d2d7fd75a97b281f458d930e586393d85726 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt index d0398f8a1cf6b263b6570ccb4a8c40f660c33c98..7a7924f65546f3bdadcd296afa7244590479584f 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fda3c948cb5697207f311f4224b332094e0598e159b7150f8c485afed17bf10e -size 89305645 +oid sha256:31aa0ac6f89da4e3d0ee85071874256cce0393680b259594d6e4ce51176d7a7d +size 102174061 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt index 45d1bf259cb09935a839ce1d87e24679d49efb24..1e93fbc8e2a8a80263aaed9cb4854217957d1142 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:359b78d21e1ec5df8c72dfa7eefe0c99f5e33c21e81fe88cde6313a7a824d4c6 -size 89305581 +oid sha256:0ae4639a3f0f437114a2a6996aae6aa257dbe2b82987bb78a127dbd5a1d97705 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt index 2cade3af46110836fb5ac3937d115cb3fc49a13d..f37d1eb16a4c98fe4c8c5de2ae7cfd04b83cdea3 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5435ad327dc8a75c0bf3bd4542755aa46e38b44befae99f06381590f4ead5462 -size 89305581 +oid sha256:f558d74f713b1975b7dca4cdbcd69975471d61c8ec692fa5dfa762d43e7fd691 +size 102173997 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt index 8042322f96fd83b75a0d68f44203672579d7ca9c..61c85840922e7491b317f00f23c4051717baeb22 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:966f42938103326236e2e0dc455905a988bd299aa8966a529ef78eb53ce02c81 -size 89305570 +oid sha256:befb5b2632d3ac002c56d5e48f0d18326cc4ec9a0dbf4481403cf3ec3ce2ea42 +size 102174114 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt index a443b43bc88da6d3ce39986d1244fe423bbace90..30c684b073b7e85a76df30d2d9c0ed1dfea49109 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2284f53e0c2780207bb79e20b256c8302fd7046443e828774e2adb3fd5752544 -size 89305634 +oid sha256:d2376b2ebb321bfb30ebfaa68730e3677bcadc3722ed3080f2a5bcfe5b1ff6fa +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt index 365e400d33b8f802bd14e595649823c4b893bd66..08bc2158bb8dfba967fa8d29ae722b92ebe83276 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7ce0352a36437961a279bed977d19c16781470a6183699d62c5fece5e11ca41f -size 89305698 +oid sha256:0820921b0cd92ffd60cf83c0fcc561f111c9201cc89d4b01d0346c6785db0ded +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt index 384e8c78784e4be1a9e9b9111629e2f1fb84d1f5..fb8db6506ed9e5b6e464be93092733a3cb456e31 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5b9712cd0c02dcc74c57c366faa274d84c3a3273569f11b0d5e908890300e2dd -size 89305698 +oid sha256:d32f8e9c542491be781e3fb206c41cab3cc974f6d6286c888fc51169fbbcb153 +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt index 7b9a38c5dd58263c64fc4f5708291a5be03b9371..c2fd9f4183e5c1f1bb3f175dc435a84dd1fdcc7f 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bfa522c877d0e267df5c02b87706f063b094a8c714a8e9c7de9e84a38689f83b -size 89305698 +oid sha256:41525a0fbabe8d8dbec76c7f97dc087079780ddc87eaeeb472df8eedd15be1eb +size 102174114 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt index fc35c56d3608661afc405e6989ba81c1f4fa0fb7..51bb540b198c960a3110a92356f7a32dcece3f0e 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4211fc80d3c9634782135f183e5444f6383426657ebd01cd87c5338a85640033 -size 89305559 +oid sha256:9e44bd1c3a81ade953d973fd87fc4dc94d9d1e58a5231046b4a4159fcca02735 +size 102173975 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt index 5aec8050dd8507a8ee567eaa6b6a843b136ab02d..6caf2229bd3e11a0ca5258f5436d7ed38388fc71 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:42cba6b620f1918f8e893e2e87620deb08bfae772e39246700b1656586ba09db -size 89305634 +oid sha256:5218357a4ad3125b4dd1e0056abd13629cb90fb84798772e9925c12466797e40 +size 102174242 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt index 77e78a5155e788b9c4e8b0a9760f3d1cd7d9e7ec..c81e204feac473c1154fa695109e32d29043957b 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ef90d5637a7f115bb808c0fb39877df66ea8c1fc44c655787ddb119335828caf -size 89305698 +oid sha256:bc4aae4e928b7ed37b5e875b06697ced2de1e397eb79b9814c9b5548f05a6b2f +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt index 8b71cc2dc5da374e01e0cd89ed813f98b68e4eb1..83d8c953be3786b4e160fa058c5ebf97bf8c0985 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:03d868ac93dc3d2a15ec6c79cf661a00604058f74f26e509e51017752a1aa57d -size 89305698 +oid sha256:779d832bedc0a2bb60caa447c9e8487660a7e334074234c55de2139249ce684c +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt index 42475f6979ac17242da061e8a44e85be8376a397..1a4c607106d712b2c432e01b7965dd4695e17655 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7ebf0f1df99ff13b484217ea45dc4e937d7d96240555261a0b700c79ddd25583 -size 89305570 +oid sha256:c29e82704e877ace5654d5bbcc74d1ff4db71c527348137e9a535bcbde2861e4 +size 102174114 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt index 227f39b4c562da245cb9e8e1084298c2c9d96580..7798073bdab3bce263cb466a9d2cbeb815038c15 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:67780b310d6a356ba29321887b3ab3585b42e5f94c392a5f85ece5f69eb81020 -size 89305570 +oid sha256:adf50024e9b4ace6d2b880c0e96e31a232c7684afc624ffa173f23f757845dff +size 102174114 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt index 6949d06e1be149ab19d43ffe1df074a87d04c540..df4e23c25582abb3e2e03be1c372471bc2c51b3c 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:16f9365325f794de749fd005a36f95f02897ff4a92038911afe10694e762b295 -size 89305762 +oid sha256:0608e9e7374a5e8422d38ceaf3f8ffd5b390ebee583b3a654e4ca5a33e16b968 +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt index 328e0066c332ff7bd49ba273b9fe399a6ee3952d..d8009a4a8ae9af27957e4cc3000eff5e33c260ce 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fc7ca7de1bb2602de55005e9e3fca7be64fe292f4fd329a0ac24e2cee140027c -size 89305634 +oid sha256:d09b1cf76d2f9778f4e6fcc69b71bd0f3761b8fb3ffe5d64489b974d78797b30 +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt index d64b5aa105a6911709fa0366c7dfeaa103c6f62c..5f2303324cb98697a7fe5d09845a384640725bd2 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b5dc94b23c8af1f4902e17dcb7cff197995813a5575eccc9d9e72907237a9a42 -size 89305634 +oid sha256:c933e86981e562d68c19b700acc70f478596b1db49d51f11b2fd17de21638fc5 +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt index 43510d865a99ce656ab0bf132869d0a5e299662d..4fe2c4862f5fadcb8e59c10b72e796f9391f50a8 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6a4644d8b6fde3b09a2df38d0597c250277b067a971cea09f962a90c3df33ac8 -size 89305570 +oid sha256:f045f60315e5fea89dc202d418eaa6b0117e7ce0bd14d2cd09374d8b1e0fd450 +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt index bd5e3ee2dfc9d1a5229ee18c754fc56d8e6ede16..d3cf6e9715b628bdc301bca104c4e14c637e6a5a 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e13bf2534db3e59a398ba7decf29485295e3ccddec8c97ff2df9175feda7ea43 -size 89305634 +oid sha256:33bfaa2cf77ae35eea54ebd681698a6db55fbecb136813cbf7b253224e74d67e +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt index 9fed2bd3720a3b91e90cd7a4f4c59e7a7984d693..a64fa37e6bce6487e799c20a2106891409b58877 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3e3da35874441f1d7d155a522062132b9dca91f8fdfbe8abb34b39d4d63e7d32 -size 89305623 +oid sha256:9be9fcbc4d7f7fbcaf52fefe85f92f3f7ff59eac021300c96bc0240830eedaaa +size 102174039 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt index 3f8e56232ef5238261ff767bedfd827707b14a3a..fa09005888dc2c8e017ea08abc510f89d159c5ad 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:72e927f1a6dc7f474a3e9aa1d50d22794d8cb91df695056477c409ad3019d2b9 -size 89305634 +oid sha256:e0d74f2d531c3bcd452f252dd259d233bf8cd3084cb135216475d78c13b18875 +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt index 2fc69b48ee4d03f2a3fa877931a0248d256241a7..650fed241284824b01037cbb7b8648922a90edb7 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2d94a12e7df6691e0372cbb3b8ab9816d5f63454bf7d6001958586283c1041e4 -size 89305762 +oid sha256:39b6929aad1fbaed9d7be6ffce4601bcce80df89a508900d75c2d11b97c5afa0 +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt index 54fb67e4eba7a5c82b36273386337090f1014327..5472883b0a6d1bc5a6878ca0ea4add38abef38ba 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ae86fb049f0d14915f9f74becf0865138226b9889616e5647201fd7bd37ad2dc -size 89305634 +oid sha256:423bb2ca7f48cd4a5695f40e13ade51db73f3a039cbb1a739425db7516aa7a9b +size 102174114 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt index d0b2b786e536557b2ddbd5115a7c5115c6e3c554..64a79830a659486c8219a7f42c05c232a1a2f775 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e8c0953ecb99b9f3b9bb11db206383d29b5854ebcdfc0531929f0e228086fd81 -size 89305570 +oid sha256:3d0ccc27276534df1b8592fb3d989d7cce1d3b1c054a22068fd31a4f742f8002 +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt index 7617d2b3623e4d92c974ffd4d006b19e85355390..40b6cd7fc4efb97f2b83d4497e6f794e7f46130c 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e1fc718aac7a1aeb79fe54cfc6177a9391ae8b257c04db5d576b68dca72a3a12 -size 89305634 +oid sha256:70e808bc1db3733ca60a0f4e759cee0167e85432c74fe1b05d3d68a12499d2f7 +size 102174114 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt index deba4ac80f6532d3caa960e981f48c3a5466e1c1..3384b8d916be6d2ed2f38b19da60c577b7b8e5b6 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1068b9246798184326a7df25fc7ab3385eb98be6b21035776fc52af1db4b554d -size 89305634 +oid sha256:aba5d380c2d2bcfed5e9492513d08c1269029d892aa21f825ffa9ddc37e25f9b +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt index e6632d7eb43d901315ba7b4c0d771e28e4634e70..bc2e184b9fc64533ee269f2615f576cbe6638c71 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:239c58b815ea3952bbde891a87932bac0b31f8268f8412f337a4c7aeab1417be -size 89305762 +oid sha256:79a2a46714033cfa3cde6fbde2cc84604aa7bb5587141f96aa621937a31817f2 +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt index f112f3df938412e1e0c442fd0e09596c8e52e88b..f09b207a89924a70570d2c1c0fc8794942ad1951 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e5afc9a09663ca2cb6be9d111de8e0e7ab550d546531fb08d9b8442c263f82d7 -size 89305698 +oid sha256:9bcec69902ac16c673de1559bb8d7a58c68ad41376ac84362a32c0401b0ef950 +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt index 1b5880c0e967f7337095e4dc84cff26b87d5dbce..6cb8addd760ad2c1876f863f11efbfc64f6a59d0 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:94e2c42d635fd7ca586313495be7481581124ec1cf514c85c7ea00c312c49848 -size 89305634 +oid sha256:c120b2758254ca2ac5cc86311cf0ffd56e2aae096db540bb3c8f8b103135cb38 +size 102174178 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt index 334eecea73fd2387c4183e370008d5f1795844aa..f1e1a41d41f3a0c040cf3d56b0f38a2404b0ca0b 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d222783c42739ed620b886241cb1eae59590f510688d6426f4728d654774cb6b -size 89305634 +oid sha256:970031b88f2bd351616331a493dfc5d5aaf7dab1777aae19363a620d474810dc +size 102174114 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt index 5046487824a402d419be22e5f682fbdb6e6c6c31..82999b0221fc14fd256b9dc505d4372f16d22bbd 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b539e746e5652e00929b4d4f540b7a130a1eb712e91c5fe403d6114c7285e5c9 -size 89305687 +oid sha256:a69d561a21fc83fef80fd48a5e07454b65b2c2c853eb6b7c52dc4d7d37fa164a +size 102174039 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt index 02c25bfba606a43cbe05f4b2ea08cc0daa3d1cc8..8e0f575294139df1a2a95f831c8be70f086dc9a5 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:57d4953fc4a5910a7792a24a2d6d36256764e1132e663c0af3df224a7d828844 -size 89305634 +oid sha256:f27c374e769007faeea74d7d158b2071275baf5980e0ed37d4235fd19196ff31 +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt index e80dbbf815b9a8c5173c1d752f6932fbc9cef44f..32b7973bff1bd0c5cd34ce582b5f00492e8c97d3 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:70e20c95c7c88ea1dda3559a53e0cda8632b15ab6671949af41cf95232b617de -size 89305698 +oid sha256:6ce196dc33eb41831e8c811048377387b6001b99c9150ea64e2ee0e48e0f6ebd +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt index e38b4b8b1a1779d92ea9f76efa2219149d4b73a6..5a8db92555fc3010572637036c0d6bb8d142950c 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:747121c86fe79d69ee2296ee14bed737f69b1d7cfc06c5d30550105b3ff43c36 -size 89305570 +oid sha256:d91740fd07a9a048fa31c54065f7c886746e36cdebb0b99188abef46c077059a +size 102174114 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt index 5ca04f15a9e6c76e4b47fc9faeb46e91267b2319..ae70bf343e1bd6822f63fb675005177fe84c5778 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a2724070f1c9d094ff467d8f2fb98f8afb091ef0491f00825d27920fdcef3a15 -size 89305698 +oid sha256:f9c376f246b289612de5f591a2ed1846a3e5d0fe113a5b342da896d2e3827b58 +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt index dc2839d75fb43c8992386d88c3cbb1c6c280657a..a4238642730ca41a9bc297c9be0629cc1ce15fdf 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:86b0566e4178f1d065e22f5f714a54d3d5f1f68ab40c61340ecdbe916e3ba3a1 -size 89305570 +oid sha256:102acc459ef3e640c7044455f7c696458ec6a6e726e6155a7b4cd75dd15cfafd +size 102174178 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt index 5b53309bc1fb942fc185583e17bc79fa5612321b..2830115a86d6289dca9e472fbe8ef52e726cd3c7 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b84693ebe67ac477b3c8b0ba35638a6f9b424d597a0726501bd9b12840f60528 -size 89305634 +oid sha256:902487fb7eadbb5d32e4654a7558025cfd97d37c94d36d7a63e22400d0d55809 +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt index 682bce1a5b570c01fb7c112444eeb50e005e475e..620ba751e2615b84bbbe321d37e8b4430293fee2 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a85287de2ab3459931e11e1d16bf375706a53a3a636c4374c285be2b0a9bbba4 -size 89305570 +oid sha256:47b57635620a183a0369b53c5fdc93185e0bb2671832f380549db46f8595ef7e +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt index e5560c693ae000d163d53c87382f2f4db4df3bd9..12b152086d4b8b677d9b2ca71b1aba112b319a8a 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9c6f8ab32db719d79f675f4002b282d8e332c6a0e47f19c20ac4c2f473751bb9 -size 89305570 +oid sha256:847d2445c07f3a511a6a6107f82840593a4daef5e67c4e13ce2a8213f2c5216d +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt index 553533babfba9e32e23f957b2ae6e2154fdaf8ee..43ea7d55e72bb2df259775a5a35062a61c995438 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:022431d6a5da3d6dcadf5f9f3d2bd5724e6c7d8699a16f35ec3d6758e8910cb0 -size 89305762 +oid sha256:d61d30bea7f3cc5edb2a0e38435b73dc1416e1052a938dc120d533cc9c5f00f4 +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt index 81f0e0aefaae13140cc596fdaa025686b686e2f0..39689341e56fdcf6ea6c292a84043ddfb1f576a1 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:89adca5192b17ff726ad7819948e155c32b2f2b12b74d6861b95fd8910cd5d81 -size 89305698 +oid sha256:065c91937da496b48baff269ed1a226c226b2c87f78109b0d4d4f8bda3abd41f +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt index 89d2fc6df49c9c876c068f6afa1bb5979d6adca1..a1bb26ef557c71e5e179dee219f1f3550abed507 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:31516fe3a7fc69bd4d33fdd92e9c699dee07f4ad69655ca747ba51badff699b3 -size 89305687 +oid sha256:67a2727f7d03365f008e88e8caf7ef37379d903620e6546c17ebc2362b85d28d +size 102174039 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt index d472731254034fa6e5210d2dc151baf80ee4d603..b7ed130f4effd1343fa31cdccd6d10f6b5402b23 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:574b76e4a6babdcc0fbcb6d6e5e8eae7644be1ce8a02ae5dce1d8cd0d0181480 -size 89305634 +oid sha256:e93b9fbb6f44d499a81f38cc339990b63c949f0186657b0e40870db23204a119 +size 102174114 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt index d2b56c8ae213d16cb231c5f21da61d1e0e635b29..be892c6d0d0460de09193613f846f3797b89876e 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9c189c4685b9f3dcb51fc37dd71a80a1371c086ce797958835288f10c22b677b -size 89305570 +oid sha256:2ec634489fd70f40a7de148238c95c385d0291812aec5ad49fae73c9c88d9cb7 +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt index 490606358d65d74091adccbc3e905b9f334196be..92daaecfc6eabb3f9c7f65d5eff233a2cd4e0365 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:82c7dc74400c80b2de8a54eb9789a066964463d6fe3684905a68d3acd11ad32f -size 89305634 +oid sha256:301dd8219e1c03ce000690a51a9d0b2037b399c4d5e762d886b65552740d525d +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt index a975b132efb99b85a05d415c70ca731c365ea9f5..70c9c1c1071c89024ea69c4846afef4a2a228e2c 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e217fdba2e79342d079fbfb14f250735f7bd89329f0c79bcd30196adcdf9a2a9 -size 89305634 +oid sha256:c5950b8cec565b39ba5ed1511bcb273915e2e9fef9f48a414cd0dd09885b6e05 +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt index d1998c3fc3768c2731c6c4b06e169c4065b8bc41..75949076e7089c73c1af5b0ecf21bf9b4633d3ee 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:72cb8bd26ed3a95ce5fb0a0ef3293e4c24b47d76a1277070bceabbd5f5559869 -size 89305698 +oid sha256:95ce04964cbb010a8c8887cf539794ed2a152bd7362e69e83a371bf5d05dff5e +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt index 34443ad7e9f51f7e15f0a469992947fe7ba4f7a9..24feae9a6a79e54dc3230d1b087eb62f733bb42c 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:69f7ff424ab2992094fc49e72403eb39d69f973eca2160a2e551cde8a36a369a -size 89305698 +oid sha256:62326c64da36b6c35849d40b3d65898791851437572c0dcbd48d256f286a108c +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt index 62afe8956ad96f693d34d77888a874561a9ce4bb..7213a5f74dc8bb28d346389d4517c25418244686 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c329a55abbd032d649d3272985ee89ddf46cd598cb63d9ca507de3be9681dca2 -size 89305570 +oid sha256:dc52b583953ef23e1894b1e18200323ea1087e94908d2b8cb015e172e2b44b4e +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt index 145e893dd70c74645f60472b008515b76a6cde07..25c2050913fc89ff03fc2af24a0a5aacd59ba0c7 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9386c4bf07e86a4a417bac69ccbc2f0d7d150ffcb67082ff8bc568002a79f084 -size 89305698 +oid sha256:3742712930a040fce459dfab460d47e1ee2982c3a89793a77491dd92abf6d6f4 +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt index 96257a2aa58c949be91f028e37d7fed9e46fd786..25d4760e203a0bf750460ed9e8064ed2c011a026 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c24136c68bf8e3eabb4601b6192dacbeb5e80bf8df13b5cc8e5474a44a6b5292 -size 89305698 +oid sha256:e524418c4a726c1a17d0012bb1b4288f78c99120e03ff517b80d55f7ceadbfa2 +size 102174114 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt index 56405e33d50ce4b11ed03ebec1bddb0b6ea7d555..3c48acbe401fc2344c9f80cd4ea58c99afc54828 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ef83d5570bae4c849000ec682bb8abf6ad139a5692c5cc522bf678c7725e8500 -size 89305698 +oid sha256:307b12aaec07146613595f3eae3ce4f5cd78279a4fc8b976429f8b99f92d5387 +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt index 5dc05563925fef8dd083f354186faf33f354fdab..5025a906af6dc58b70bfacabae78644630d99335 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fbe37acc1d237c6053dd017a44c43571d8041c784a83d59f944a9725f2015fad -size 89305559 +oid sha256:807471aa2fb37b8781d53b2dd97a8708b5a57fa2331f6f160e1fbbd19b51d6cd +size 102174103 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt index 580a239c1d4d559eb3e3a16b3c62fa650dbbeaa1..410e9bece628eff56f0d86143b3ee156738c4434 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:308d401bfba9ca7051ed5479c31af7a5e94306c245f54b8f599c01e45f2418ea -size 89305570 +oid sha256:0feb96870413691f30a74cc100f519b4ce27d5bb95ce63a71d9eaed6915ca4ae +size 102174178 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt index 225cd25f81e64586af1a4c6ddbe98fa6c16319bc..da8bc321b31f243268fc75abf748e4fb3b43ed94 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:78b9f9122eb59022263ceb2a91779bcbc814c03772fe68f316a3758bc428c071 -size 89305634 +oid sha256:122e7e9a2dea64f60ba44aa73f3f07dc41b9f473b40b8f2d726d566e8859466c +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt index b5b507298193065388336d7e1da736684093242f..668d1d6d79a9af5a393ceb3334e3e176ad9edd89 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6c39cee571508109f7a961155a1a5751961393040a5bbf4adaccfe59ebf8d97d -size 89305634 +oid sha256:560eb0fa116849026dabd7c92ec4a137ea557f77987a5ab38f91008a26bccbaf +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt index cee693367a1683e35154c34f68b7d9648483af08..77d7b55b16f55aa68cf157b30c9d318dab515ec0 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2af13b821c0def39aca681950687ceea308e997d7ab71f219347cc5584ddbfd6 -size 89305570 +oid sha256:995b045a3dc3ee42863808f62d1be969d62c2dfa3e5e71d4533ad7f9e24f87f7 +size 102174114 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt index cfc6839c5712db29d8e5b6af1fcda4c3c7afb666..731360f94aacbf999e59b56577e1ad0fb5a65f21 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2e89372c2395cc3738f662ccd661299aa6e32c6f34c0cee48a3e97695adb0ac2 -size 89305634 +oid sha256:3fb072aeb2c6b33e15009a227a71dc1836969943608f83c3853e540a9e0ed9be +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt index 2412216b965dab7600091219fad7364edbe6118f..183d8e64d7a7c8407148a63cad780066332b41a4 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:491b39a90cab8543731627af5c4489d34587b7bfda20db2b33dbc1c59da5848d -size 89305634 +oid sha256:e815493bf6b0e504138b97e39baa18028338a1e8a48e69bfe56a2d721a5d600c +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt index 56dcfca98d0f061453b4af7927ab07cd5a385314..2bc577842aa7e56974a91799a40fc753725f98be 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:df35e9c76cb0f4a9dbd7a543ed8d6cf2dba48e813cd6cb5715680bc03e14bc8d -size 89305698 +oid sha256:f57e25fb9dd4bb7096f48b65a11ad86ca001b4efd054d5f75b0ba3494967a2ef +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt index 2fb3ee87d5398c64cf95bc1981f530098043d428..04eae37490be68e1be666c6f5475ac5167574ff5 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1d5e6b9d5a1c987c8c2557a86f3d84d38fbdcc6d6f7459b0897ad4a35d4cea06 -size 89305698 +oid sha256:276e192c21c0f7ae1d4fd28665c1f11030b3ae44267f29bebed3a2365004d49a +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt index 90812d8133baad9b93fa62079ad4108866144a7c..d864d1723e1e0c6d3a91083012ebe3c84192751e 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0aacdb9557bc7d375ffcbac2765f0aaa3493a08bf28665b0cfb4ffd59481116d -size 89305634 +oid sha256:2331480f544e3bbf7300939f3f4e2624f90dada10f744ad89b44c29b67497739 +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt index dad2a2394eb73d88b62978e0433df0ac34798982..a538ea36846d05570a4696705ce64a5967bb3ca1 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8bd9f76e3d55a0e945bf41a3d4e2cc953a7f61a32d66b6f61272e699145f6b35 -size 89305570 +oid sha256:6b9f0bb15d2c7225ae0ec6f6b50e67ddc9b3655208d8acc3914b6fe021c01b7e +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt index af503c25311e53a05022a82bd17fa1250a566954..2a10cf0f6e04d7be97987982ee21c9198834d322 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:eef9f357f4329a1f0e08423484d06922955977a68e490c8c0af8caf3fefd1d84 -size 89305559 +oid sha256:b6e46b6fbbed27d87d35a98e18e1fc5616ab7e77d83546db62544575f956e7ae +size 102173975 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt index de1ce5e0fa5898114385053c6b75378507925085..8bc7d63a88e5ed8054707f8121eeb6ce7f3217dc 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a876daa59f7f4a9b120841b2ba73175a1239b027af7f7b714cf90f35eed35647 -size 89305634 +oid sha256:8b0bd426242125ff331a315b9c3869f07260f0b4ab7b31a9f9b796a3f2ad06cb +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt index c94477e3b1e1013095a16df45bb49ac350084d5b..89c5c411bc9842d9ef208f568385cd41f6193c2e 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:df23bd191640698bb29fbe6745bb5e51aeba230af6dce199d9aa72ec727f92c1 -size 89305762 +oid sha256:0562232e1fd704a41e9bbbbed5d60fe596baf91e7d0b5e161cbd30b58b6f02c0 +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt index 09f9c8845261385b1495d81a4f8e2c461f928f0d..c9e353503c8c61eaba1c5059eb4814f4efe0eb57 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f167b9483604bb223f35f7faf738c3dd7902a85a7e89d0ae13bc0b563a808f9d -size 89305634 +oid sha256:f900c14ce2cbbc78cd3249ad7368c4f521669c972be98bb023579dd020a197ea +size 102174114 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt index 4fe023278e2d900823702c7f3f4bf2c2e9af3f67..872731431f66b55a1d9e4fd19a06277ad8cce2ae 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:232fdbe4ae9e04ff5d2d2cb190114b57540e05518908145d595a981f1eb73139 -size 89305698 +oid sha256:9c18393a37e02753e483120a27f6df5f33c6f8b44188d8d5cfff490862a63519 +size 102174178 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt index 354f6ca5663892ff22e832420b303c1669795e17..ab6cf8cf56b997dd3c7de28ef6c16edb5f3a94d9 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:738517dc275ce528c7aff0081de4dfab1ade25e319f388934522c93c6820d024 -size 89305634 +oid sha256:7934210e1c7691499bf78534b9056603efd731233af9a202adecb3504a618bce +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt index adaa4125d029539c7f13862d38bbb890e068a905..1c8e6cdf723652518899dd24e8774cd44f317132 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5854831ec5d2bd01aa3dea43ce0c24ef4326fcd55f2b5189e147a0e828e90e92 -size 89305698 +oid sha256:68b60376a6b1496cef9b6af06f38e8a2bbd7dfde740c340e871987a2c92183fc +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt index ddec5e5b6508612160367e6fc75e77eee92a03d6..bb1064c533dd1ca0fd9fe36a0858749d3a21d39c 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3c5b4b5a07793f1eb517b1805d37caddf81a059da6558d9c28e0e61664583c26 -size 89305698 +oid sha256:33b6542bf0dfa0071bafd2215f1b7f29c04d41031729e7579a716c3d83694f88 +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt index f5dbb4c465111bc1a779b446cc5f732372740f8c..d5879488f14b25435095e1e3b2f46b8c361023e3 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bb1fc829ee6c07e5c284fdd301f4d8149a825c4392883a2d6f6ce61755a70ad2 -size 89305634 +oid sha256:d6235be0f2e89cd415fcf23b0bfc493f5c3ce65417cf46e3757112204ad14aca +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt index bf76eb44e3107270d570571039873c75b74eb837..20e4cc7d7288b08352cdedc7660bc3e0ba1247b9 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:70633538228c4a7c96c64adceb11cfa56bcb6f4d5ae1c5e489be082d7cb22aa7 -size 89305570 +oid sha256:32c1e17262d4b5c0385d10785705c0c2bab60dc6c3bcdf15f4297013bb2bfe11 +size 102174178 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt index 6ac51afa5ac2decf55133be04c2df17294169fd3..39401417b31d011ef2734f1c0b7fb0934af2775a 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:27694e88251abc513b5490ad30907a298813648cf2a86d30b01a3122a614345c -size 89305634 +oid sha256:edc423c4cf6765dac070e37144704f987e0394d9a2c88c87a91a19cb13516d8f +size 102174178 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt index 569d9faf2f32898e201b6d678652f3c46268303e..b2761eb4d3e0f6efdd03b3b3abcc77b8b8c47f62 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6a6fef7c09606e541810258819a4e0fb32b36c31b885fb1f24107e642ee90a33 -size 89305623 +oid sha256:e159bedfe574d3fd46e797c14d6ea6ab4c0492c068dd5851b58d041485a40ea5 +size 102173975 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt index a2b7692c0e35e0106ed35f04e76f69f72e3a1613..a636d9f23dbaaa6a0a253a20ca3bc31cda4fcacc 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a4606e072994c98399ef1cab4652d9f06488aec2ffa595a86d16841a042d157c -size 89305634 +oid sha256:0380250ccc5ead0c107e14c763744f68d298c114a465a2d45cbc004fa00292c5 +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt index 3f9fc2b2c7681de14b0d19fe1c42bc19be0bc1cb..df7b64c39d95226d137b6c3bab7b8d4aed31c38f 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0860f063b214cae505ec54566569a228b81cd0eb8fcb293d261951da4497e9b2 -size 89305634 +oid sha256:c4678bd0b51008b1c6778949a3a14a694e34f8e203c89e93706fee33b8f7101e +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt index 84142e77272a687d298f76970758fb01ee10586e..b19469df19368aaa8d7d25d66d4ff6a047625083 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:15a0424c2648b6610e4fe04912528cad67850d651c03a25bef7f952aefbe1df3 -size 89305634 +oid sha256:d9b788060ced1871243bf455c53d016f880f3ef5dad269e3c8cb1ac46b88aafd +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt index d54547a7a57035e1cbdab5f7599e856567d07c2e..90ebbe57176e0303936e1d07a82f73dc2978dc20 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5033e559a57bcf39d744a2854058454774071323154edc39d6c1adeb77d68fa7 -size 89305570 +oid sha256:64ffb260890c408e3f17a4b4469db8a9010c4e1c9a7c80ad68a697f34dbe2eb0 +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt index 8228178a67ebb4da6ab1a78b512265a7972108d6..af5bf0c7b379407a20e8bc7f2dbd6e6c8753bf46 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:421c910f86264a273baa6643a8f96d6938c971f523d823877b526a531566ea6f -size 89305634 +oid sha256:0b1828c98969f702d38ac3537890cca2bf7cf1a70ea82f6bae7954766745e1e2 +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt index 2e55905ca1a3fa3847e01963043a6e1904d02f44..b406a689827af64fd012151f3526d7b7f5d7cf8b 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6e3081a72c37c5a0d100be6acd616c1566488b7bff1eebcab8944240d87298c8 -size 89305762 +oid sha256:d977318314136ed6fd3aaf5e4f49b1d67f61b4602add115658a36456d19447cb +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt index e30520845b9b110b8859f25fb12064aa22c6fb48..9976b1692773bbc41d3b3660ef1be2b04ad96cb9 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4eaba0125e4370375600fe66d8c7dc0b118d05108654fcf1ea631976644d8127 -size 89305698 +oid sha256:20080daf89ba5cb236435e9b27c2630308a5e3f744873f6169957044b415db62 +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt index 31017edc270569e08fbf346b27d152deb2994fb3..8068d55f83e5f5c2dedefe35ed33d719faa49849 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:75a941daed2a2b7b17cdeb689b406c443dbfabf6270aa36c073013a3df1682e3 -size 89305570 +oid sha256:8a1f3398d7478af155f6f73dca3fcee1a0777bb28ed30b9dea398ad1c331607e +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt index e669bdb49f2cc0b15a84250d3b4947799c3a0318..b8b81550926f00006527ae011f22c6dd86b72e4d 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e4ba962255d3bb5436706eab7cadad1953e347eaa4028dad9c1e9998df8bcbc0 -size 89305570 +oid sha256:64b3dd79bbad0452c691fd37d7601a48376d9b0e2be18b904436f946e772d1e0 +size 102173986 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt index 1a3aed3622658580b9e21759820d2c3107fa17b6..a3f06fb6d863dc4fb64b4d2d56966c7c8c20a5e6 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0ee89e2dfcc23ea60ec58981cc1dfb0fc94d22861b6119c4c96e3bbb38f9d94e -size 89305698 +oid sha256:6e50d2f99e504420bc604dd4c6df50a860ff1796bdc7ca7cd2c42d7a37fa4bec +size 102174050 diff --git a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt index d2758f6341443a5793d0d07a34ede85c9d7cc1ad..f9582de9b3a466191c337ab97ed71732d016ec3c 100644 --- a/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt +++ b/2b855b9bc4opt/global_step70393/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3471931cdefb12e0a94631600a3655be2da64562730d81809e7aa96f091837c0 -size 89305687 +oid sha256:9fd981eff334555c6940ee28e156a5af9d938f7ff41d9e7fb9d10b8323ea55a8 +size 102174103 diff --git a/2b855b9bc4opt/global_step70393/layer_01-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_01-model_00-model_states.pt index afffaa1bdfee039f6a29c4cb47baebb3745fbb3e..913032e212f7b72d447347c49db7f9f13d2c0495 100644 --- a/2b855b9bc4opt/global_step70393/layer_01-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_01-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ceb7561e97daf4dfc1c57cbaee9603e3e350a948595a2b157a8c56e5d19d19dc -size 241239299 +oid sha256:b65878a1dd21682bc4d6e6c4e94f05e91cb484f256d4133a025f0c9fb9ea4286 +size 268043523 diff --git a/2b855b9bc4opt/global_step70393/layer_03-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_03-model_00-model_states.pt index cffb6914285e86e3678a12b836bff2093380200d..3a473bc80859cde92be0dfab642b9f9b739509ca 100644 --- a/2b855b9bc4opt/global_step70393/layer_03-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_03-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6f4205a17fe5029e2e80706991a2d418aacf8e597f64073be9a482da12e9313f -size 127466243 +oid sha256:b181e8398650ab94aeb634b317f696364bbb23af4b924f4e8240587e71fd51b3 +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_04-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_04-model_00-model_states.pt index bedddc877647b46dd18dbbfc1a71385d068658bf..52e3d997665d5ba88b8071dba5063212448e7a74 100644 --- a/2b855b9bc4opt/global_step70393/layer_04-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_04-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7697fd50cddef42b4bdfcd2db9b52075dc6278155ae925ec8e8eff72281caf09 -size 127466243 +oid sha256:52b3cb668ddd17f15975adb0643eedb8421d5312f879e571ddf008abebf610b0 +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_05-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_05-model_00-model_states.pt index 648fb0d81d035f07f3d35d746c300100c7cbcc5f..9a540d7a61f7259a73a013a8efdc1be2953e5872 100644 --- a/2b855b9bc4opt/global_step70393/layer_05-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_05-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b2420e48edf2c9938b19028b6209fe72cb8caa57646f1681c0420d8d685424f0 -size 127466243 +oid sha256:d36bc19164e71f9211417c847046f311eb155b3862a6470882065a642ac3052f +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_06-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_06-model_00-model_states.pt index 02bcbdb6d61eac793883a6df4ea5bb30f51de1ab..b93db04c81edbc2881db28933b295ce09d5dd46b 100644 --- a/2b855b9bc4opt/global_step70393/layer_06-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_06-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:731237d4ea735ba05d62a1263bac8eb134a38e3efb25fbb22363b41bd026c0b1 -size 127466243 +oid sha256:a3136618155ea4c4d8415f6d5fb41b5e8caee4f644af2e095aa7dec1df58eddd +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_07-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_07-model_00-model_states.pt index 8766abb39c670160cb51411314f57123323c0b4a..c9e30f3f74aada8b4c85857e0a166d5276c8f094 100644 --- a/2b855b9bc4opt/global_step70393/layer_07-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_07-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:04235917a2a905bbd10e1e9416bea4776e7281dad4bfcefd2c7975019af4b018 -size 127466243 +oid sha256:e87d683ff7f41d4da15c531a484f5ef9abee240eaef31a4f72a74c8598d61dc9 +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_08-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_08-model_00-model_states.pt index 5979b5c513ff1e652f32e07e1706dcc475085519..5d1c532bd83ec380c0b08c89a60c72929a943ea9 100644 --- a/2b855b9bc4opt/global_step70393/layer_08-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_08-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7a54d536e8dc409e071b83b0ccdb18914b680ddde030e0687ea36e512a463dbb -size 127466243 +oid sha256:2a0f330a7506b14587f098edb6c338fff43a7895d5f6340a753015e77891dcf5 +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_09-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_09-model_00-model_states.pt index 1bb14bc335046b2b6759433543f0beb6a4351996..9d7e0ad37f201d0d16d4b3671d59118fdb85555e 100644 --- a/2b855b9bc4opt/global_step70393/layer_09-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_09-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7ea0808fe68dd8e50859d151731bd0e13def2867929fc03fef93b4a9efceb11a -size 127466243 +oid sha256:79195a8e9ca01fe5590259cc634a5d5194f314c95a555f64adb5f48a4cd4f791 +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_10-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_10-model_00-model_states.pt index d3fb6595b9be6a4a231602995d3c90cf4098ceaf..e85e4a67c73a9b9771cf6d253cfbcfa1cb692a6c 100644 --- a/2b855b9bc4opt/global_step70393/layer_10-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_10-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:79601a3b6299658a1aa76da1ad2136fcdeec608207b82a7380117633c6482b1b -size 127466243 +oid sha256:7c4f00f66693bbc5134aa872ac03ef1c64db80fe1bb300f13e45433d97419644 +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_11-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_11-model_00-model_states.pt index 3c9545ff2b8941f9ee698489fb7d9a76148526fb..b46eb85e08ad3fddec55f4c2c6e92e4c622a7f2a 100644 --- a/2b855b9bc4opt/global_step70393/layer_11-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_11-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:08baffe7c63d9c9f31b62ce3862fc6b01ac8a8ccccf060c08bfa43b34e6c34d8 -size 127466243 +oid sha256:5e61fa93d4c13d21946b6561796108695dcf04e6672e5cbb8ccb99690cb0b6e5 +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_12-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_12-model_00-model_states.pt index fb344f7c66f41e2561ebe639055152ea87a63399..643fb128ce1b5452335e28b5599f17df2ba961de 100644 --- a/2b855b9bc4opt/global_step70393/layer_12-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_12-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b633e02b32f1052a0ce34446f7346020f388008a867698685e2f6bcfab51c173 -size 127466243 +oid sha256:9dc1d5cd8421f5e6a9297a8b4e1cc63ebbb956f5dd340a06ffabf02bfff2912c +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_13-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_13-model_00-model_states.pt index 39b80e11a5796afcd7813c9b1f4dae4d4a4d5e09..232db9de78375a23ba822943ed78ccc8fbc4051d 100644 --- a/2b855b9bc4opt/global_step70393/layer_13-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_13-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:40040e5f4eedfd6ac917e719ff0f90aee27268833386d69f42f05d0b3c35ed69 -size 127466243 +oid sha256:4b5d4738ecba61c2f2085d7dabd4493295965f98b3add0a90a08841a09adf527 +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_14-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_14-model_00-model_states.pt index 1c6cd50de246389ce2dd995d17c74afbccfc5750..f7df9fcfccd8431adb8708ee5befc3e63a85d167 100644 --- a/2b855b9bc4opt/global_step70393/layer_14-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_14-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8e752eda487841f592832ed558db9fddfc167850f6f8c4f1c448cc41c3fa626a -size 127466243 +oid sha256:ec732fdf47189b990f77b4a1a47ff1193f143cd5fb620d97ed718af0b3934a72 +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_15-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_15-model_00-model_states.pt index 0c9403b898453af906efa9fd17779ed044cc9c33..d31a87d7dd76a32993419886fd405d3087060296 100644 --- a/2b855b9bc4opt/global_step70393/layer_15-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_15-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:eda59a0207e9909aa63ee819b281347df6c5a38d6d7ad200c45ea33bdd01a1bc -size 127466243 +oid sha256:14772b4e2fc7991e81a16a495c9bd644bd1c7c8778651ed5239cecb5515dd673 +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_16-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_16-model_00-model_states.pt index f73958f3e8240fc85162a7023e2ef3414c37449b..744c7df6062ea113710627b8a5ea8dfa409f84d4 100644 --- a/2b855b9bc4opt/global_step70393/layer_16-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_16-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:134f26f3dbc82e569c670174717bc1206a0cbea8c04b0d888ea515a080e47cc1 -size 127466243 +oid sha256:c65e4cf6eccbad43398d5a66fd84875e75954b48869263f0e1cf1b9bf1834f65 +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_17-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_17-model_00-model_states.pt index 9b5a1de23fb947cc42b72fe48f3596d2d31a63e6..2eb8a8254d2b6c5041ad1faf08a14e2bbfce3270 100644 --- a/2b855b9bc4opt/global_step70393/layer_17-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_17-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6879f017c1c4011eac69a9a0b334cbc5158267c67028cba80a4c5c9511e2da16 -size 127466243 +oid sha256:4083f4339901157a7a57f50af55fd0ead6e32dd97be70666a89b6ed6d1078909 +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_18-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_18-model_00-model_states.pt index 0b19860b8995ad16121d0991e86bfa805bfcc02f..b12a119d2a1bf0515d82bb4e4e662f64393e029f 100644 --- a/2b855b9bc4opt/global_step70393/layer_18-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_18-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1d91ab4365caad4868cc78296bf37f6d4d2e937b1a26af311297e854b6ce04b4 -size 127466243 +oid sha256:f28d53919388c09d7237135914d65f9400209446566c19028ad24af0d4a8ea71 +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_19-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_19-model_00-model_states.pt index 810c1532be61ba45e5f5ea605b1d73f1c6ec4f54..5cdef194c933ee26fc18f62498753a43dc236582 100644 --- a/2b855b9bc4opt/global_step70393/layer_19-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_19-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:17c2d0a517bc1543f4b4ce73391bcd036f44daf20a5e9698160901ddda29ce1b -size 127466243 +oid sha256:8072d23e5317c61ef3c82e7c8782c3d6baab61ae603427e806b562f6ae0597f7 +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_20-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_20-model_00-model_states.pt index 83acf6ae8ed8176787296a7d35e13b9c8b3bfe5c..6096a35d7521c195225dd2705765cc544184c90e 100644 --- a/2b855b9bc4opt/global_step70393/layer_20-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_20-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:370692724712e0347b20f6e001fa67f1085c90a663a35c91d7faa4618baa7240 -size 127466243 +oid sha256:c13489178cd7db6f08b89fe176827f39fdbcf2064afe7a7adaf2036e72c220fa +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_21-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_21-model_00-model_states.pt index 28b9318dfe37b45e16e38801b459d66b661c1d46..272542a31c213ebf664291c0d850cbfbed1cdcb3 100644 --- a/2b855b9bc4opt/global_step70393/layer_21-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_21-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4a4314462218d301297814684c7a520783268dc1f7b7ca7c77b427289b6cc48d -size 127466243 +oid sha256:4989887d7042c68086517c15a70a5d514994455a7987ca7c28f45e9e3d3b59c5 +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_22-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_22-model_00-model_states.pt index 399d9a2beb961cc5b4b579bcf90bd832ad8ca65a..3d004d91e9b51f29d6588f09bf8ee6027ee8ab25 100644 --- a/2b855b9bc4opt/global_step70393/layer_22-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_22-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a9e20b04c41b97283e69d65d8cea3947866c93dcf1872f6e2cf2daf4d2b984f1 -size 127466243 +oid sha256:6f900afa8e8a99f8fc12cd208c1488d4e48315054020f3bb7ac7ce3ca3090004 +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_23-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_23-model_00-model_states.pt index ca8d1750f1ed57394ba2c2d43502c64aa6d81432..3fbec58d271a76725b4b791b6a9654140a1d1cbe 100644 --- a/2b855b9bc4opt/global_step70393/layer_23-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_23-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:220431ec42e0bccb66426a52629a34c0a726dfd44959cac9a37826b371b2ba8f -size 127466243 +oid sha256:b7507ee0073f30561017aafc550935bf091bfeee84f155f66aabdadec0dd696a +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_24-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_24-model_00-model_states.pt index b50d983e8f6c6068a132d14fe6b233c8246e6d0a..9990900e9cf88685ca620296ccd5cae30232b385 100644 --- a/2b855b9bc4opt/global_step70393/layer_24-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_24-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d7fdeedc73174b20030a84406823a4e727427bce22f8c044e1e12c62fe9b9350 -size 127466243 +oid sha256:59821056b604e5a826e57c64a852c66120a7b23e2baa1b2f03266a8544061543 +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_25-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_25-model_00-model_states.pt index 02dd2d87498b75422cd802bd66367449db467af5..4ad4735360f1f9b9f67a3a347316a55608073692 100644 --- a/2b855b9bc4opt/global_step70393/layer_25-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_25-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2be20b7e05b1d7b2f5f3901df724fefaec814c78871d9c778a96c47814727977 -size 127466243 +oid sha256:4966986da75217f9ee6902945916f4a4be22e0b361f4ad28e350df1f51391db2 +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_26-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_26-model_00-model_states.pt index 314f7af4fb0549a1b14ce9f28dda7557e7a9f4e1..6ed8f73cd437e71abbf2566952457ac4d8f5a41c 100644 --- a/2b855b9bc4opt/global_step70393/layer_26-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_26-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:00eb89ce9ecaaf423253f920267742b843e2249f84997fc40f29cb120985f04d -size 127466243 +oid sha256:65d78544dbc34456ad267d00fb7011e4acef67e4617ec3c3986688f6ba17554f +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_27-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_27-model_00-model_states.pt index cbcfa7f23a873a5b719c6479d1bce197d43a8fbe..ce061907d524118d031c72c02a5ba1d0075380b4 100644 --- a/2b855b9bc4opt/global_step70393/layer_27-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_27-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5aad061857ccce5729f467306255f73aa50c3a7fcf3b800d3c62906adaa1f9d9 -size 127466243 +oid sha256:641cfabd6dcc2efe1e51554b0b420120edd6b2c414af2ccddf59056344c32a4a +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_28-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_28-model_00-model_states.pt index c6ac5a98fd970c695c01c76846788bbf02fcf100..544089771c6df62343543e04adbabaef508a709d 100644 --- a/2b855b9bc4opt/global_step70393/layer_28-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_28-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:edba7e68edcd80b14f75eb3fad39391f89e46107ee4e7def84a3e24d2c9baac6 -size 127466243 +oid sha256:92f33e34dd50a91c926fac76b3728dbcedbc1cc43e3ace93de7edf80a2976bb3 +size 157357315 diff --git a/2b855b9bc4opt/global_step70393/layer_30-model_00-model_states.pt b/2b855b9bc4opt/global_step70393/layer_30-model_00-model_states.pt index 6377fd21ce328f6213a99f0e84862ad502afd2e6..b1dca95e521eee29b25e2f141ec52837130cab1c 100644 --- a/2b855b9bc4opt/global_step70393/layer_30-model_00-model_states.pt +++ b/2b855b9bc4opt/global_step70393/layer_30-model_00-model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d0f0d2bbd1c0fc90082187a5b8edb29d5bb58724ab3c43ab217630ff22a06b14 -size 127466243 +oid sha256:69e2b3881d6bc11adb38be5d646d3f2f1eb3fcbcc31cbf4a5cd9e3ebc28c8dcb +size 11459 diff --git a/2b855b9bc4opt/global_step70393/mp_rank_00_model_states.pt b/2b855b9bc4opt/global_step70393/mp_rank_00_model_states.pt index 1f4492e05d6be655650b9fcede3539e4fb1a15d8..e6ebe80f92b005c5ff34b68a6fd9d5ccecaf398e 100644 --- a/2b855b9bc4opt/global_step70393/mp_rank_00_model_states.pt +++ b/2b855b9bc4opt/global_step70393/mp_rank_00_model_states.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:98c52549bac982cbbbb3f73bafca0a98bf901a09a23104e89098b83268799d1e -size 45363 +oid sha256:449de953bea560aa04f7b43160b6178f8476c22c5b67f7e7c5e52065a55027bd +size 43827 diff --git a/2b855b9bc4opt/latest b/2b855b9bc4opt/latest index 125e9347a49ef6c31c1e274272e3ee0c7333db28..c83f282b74763fd1dce06b1c61c51b42d6ed9e42 100644 --- a/2b855b9bc4opt/latest +++ b/2b855b9bc4opt/latest @@ -1 +1 @@ -global_step70393 +global_step70393 \ No newline at end of file diff --git a/2b855b9bc4opt2/sbatch_2b855b9bc4opt2.sh b/2b855b9bc4opt/sbatch_2b855b9bc4opt2.sh similarity index 100% rename from 2b855b9bc4opt2/sbatch_2b855b9bc4opt2.sh rename to 2b855b9bc4opt/sbatch_2b855b9bc4opt2.sh diff --git a/2b855b9bc4opt2/sbatch_2b855b9bc4opt2val.sh b/2b855b9bc4opt/sbatch_2b855b9bc4opt2val.sh similarity index 100% rename from 2b855b9bc4opt2/sbatch_2b855b9bc4opt2val.sh rename to 2b855b9bc4opt/sbatch_2b855b9bc4opt2val.sh diff --git a/2b855b9bc4opt2/tensorboard_2b855b9bc4opt2/events.out.tfevents.1683360453.nid006360.71875.0 b/2b855b9bc4opt/tensorboard_2b855b9bc4opt2/events.out.tfevents.1683360453.nid006360.71875.0 similarity index 100% rename from 2b855b9bc4opt2/tensorboard_2b855b9bc4opt2/events.out.tfevents.1683360453.nid006360.71875.0 rename to 2b855b9bc4opt/tensorboard_2b855b9bc4opt2/events.out.tfevents.1683360453.nid006360.71875.0 diff --git a/2b855b9bc4opt2/tensorboard_2b855b9bc4opt2val/events.out.tfevents.1683480904.nid006323.3606.0 b/2b855b9bc4opt/tensorboard_2b855b9bc4opt2val/events.out.tfevents.1683480904.nid006323.3606.0 similarity index 100% rename from 2b855b9bc4opt2/tensorboard_2b855b9bc4opt2val/events.out.tfevents.1683480904.nid006323.3606.0 rename to 2b855b9bc4opt/tensorboard_2b855b9bc4opt2val/events.out.tfevents.1683480904.nid006323.3606.0 diff --git a/2b855b9bc4opt2/tensorboard_2b855b9bc4opt2val/events.out.tfevents.1683482132.nid006323.18373.0 b/2b855b9bc4opt/tensorboard_2b855b9bc4opt2val/events.out.tfevents.1683482132.nid006323.18373.0 similarity index 100% rename from 2b855b9bc4opt2/tensorboard_2b855b9bc4opt2val/events.out.tfevents.1683482132.nid006323.18373.0 rename to 2b855b9bc4opt/tensorboard_2b855b9bc4opt2val/events.out.tfevents.1683482132.nid006323.18373.0 diff --git a/2b855b9bc4opt2/tensorboard_2b855b9bc4opt2val/events.out.tfevents.1683483049.nid006323.26807.0 b/2b855b9bc4opt/tensorboard_2b855b9bc4opt2val/events.out.tfevents.1683483049.nid006323.26807.0 similarity index 100% rename from 2b855b9bc4opt2/tensorboard_2b855b9bc4opt2val/events.out.tfevents.1683483049.nid006323.26807.0 rename to 2b855b9bc4opt/tensorboard_2b855b9bc4opt2val/events.out.tfevents.1683483049.nid006323.26807.0 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt deleted file mode 100644 index 5789bfb4fb22dbcd5adcf32b6d579127ad3da6a9..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3e575cb7fa963f33b362e8aaa0c37a4f72cbde4e33d964804793a007638ca99f -size 102174039 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt deleted file mode 100644 index 7fcedfbc0388fe7957917e1ce42b97182b63fc17..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2d5b3b6c942def0943a85051d75fcb0059eaf1d3e74134ef4c3323eb1c860a22 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt deleted file mode 100644 index 0777acbb84e78a5551cd3f2b79093b73a891f851..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8c3dc5b70c4428cbad46bb2a237995dba4ae2b0ff1a7af68bf8882725dad1fd2 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt deleted file mode 100644 index c9572c4ab1d5848fd3d3783d7be0e4767c839afe..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0e65abfca8f914d559e6f5d72397bda9c0fdea79b48d745e6fbecb7c7b819bb0 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt deleted file mode 100644 index c1be572f1204680948f531cd363e742675767d61..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2ad043c99471b4c22b99167dca623f5a74ac11c2c755ebf996fc6e572beeee7a -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt deleted file mode 100644 index e2ffe4684f2e6665a7a60888653fe59b0f8f1931..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d91c116dc1c49b9917423b60698109c056b75509c2b7dcb35186e12e755fc21b -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt deleted file mode 100644 index 8eab94295e6e358d49445bf56f3b2de328a96cbe..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0b621b138ee9744d7cc2158d3121e91d4254c0468748db965e0d8df36bd32935 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt deleted file mode 100644 index e69bd79fa88afcc653d8cbea4f718508229bdaab..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:12d5b613165db85fe6b0fbb691cebee38d866ea9e21efa3ebe657237423c058d -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt deleted file mode 100644 index 1e653b517792eefff04596677fb9a2af413cf17a..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6cce636c34df252cc268b09bbdd047a3284c48d5e12b5888deab429d530b009d -size 102174189 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt deleted file mode 100644 index aecee0b18c7a5a7a568b484b3fd2f565b8d4d2d7..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:30fe78336f267a83c6a09d8f2046c6dce2fcba53c75532465a337df062d6b679 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt deleted file mode 100644 index 1a8bed45594e9f28804d979d4860e0183a7b2dc7..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:12ef6ee6f073dbe81effe71c38938e7c5a480484231e33b661582dd4ae83e8bd -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt deleted file mode 100644 index a430d8520d898a2b606374eaf775bedda8dad414..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0c1490da4d798720d8952574a91c5a25dc47440fe4597e14f5ece51e28bf467b -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt deleted file mode 100644 index c1fccece2ef24b927e665593c3389771740904a4..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b43f4cd96c95fedbfadce7114969999d134aec9136d6dcc58b77ace11ff0797f -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt deleted file mode 100644 index 3267cf2afbf2251c466ce8bb4d46af886e6732b9..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d6443eb6c33a68f2f3ec07e95006897585cbdb851957949bdf33f3d1243fe967 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt deleted file mode 100644 index 671e2e55a25170a5528774a090d89d4578488104..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d7de1c74913b1d219e2ae46b2410b07c1bbb52d25aa9434c578afec1494fa73b -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt deleted file mode 100644 index 48a39e075bc67c2552482551f95eea0784664a41..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:db4d611325f4818dc6464f9def09187322f0f1f3cebe3ca4ab05a23adb84a1b7 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt deleted file mode 100644 index cf6411a7c9637ea92ac9285e25a54dfa8e51ac7a..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9b7dfbe1a70526e1b48c0149189918653d5452304ab17af497b0ec3e808ea623 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt deleted file mode 100644 index 47912f4d3a802adea2e922e7356540615ed8b24b..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0828ec100d51bc12e2f3fe28a834c1f74aa333a17def29414f369b8100f23a7c -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt deleted file mode 100644 index f203fa93ce221f8987d9530e13d62497c12e5f23..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:758cc6d22fa4adca0778e360fc351fbf40528d2822a6c79d8506d656fca1edac -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt deleted file mode 100644 index 9b85545c6403ddb9363174470e787f171182a6d1..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6573591981c16fdcd87d9749b563274f8b2b995c808daa00edac1e15aa48b3f6 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt deleted file mode 100644 index 9e8f6cd5154db82db5c65c7eb7d80a428e0853bb..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2f6fd6664d2edd72160968315e2431db34f708675b1fcaec5e3a7947725f03c0 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt deleted file mode 100644 index b6c1930d975d6843f30d72d45954c1b1b55bd224..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:76bf5a9dd88a132beae5c6170cf3c3797b20fa9b8413309c2297a8efa5aefb75 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt deleted file mode 100644 index f61fb932a148430505f92bf79e13b1d35fdad70c..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5fced28298efcb7410f5e31ad9da287f68768e9c69ae1b6a255d3968cff0005d -size 102174114 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt deleted file mode 100644 index 035dcb992002cf9d9329f36ae37f54391eddc5d1..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bc1f9732474ae1462968f19bcb30365d6adc968e168b21ea0ba33ed71d29da24 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt deleted file mode 100644 index 6953b8d7241d718fa92f2992f1619d341096163b..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:785602ae9978402b3821d6c87dc3903486dc5142371e654c3fc60d20e16f323d -size 102174189 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt deleted file mode 100644 index aa38c3d902a7d91eb855e99f94da6701cb900c97..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6b35a4e0d3d2914bf2a32281623091f655270e5dddfbdbef77e1e415adc32c73 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt deleted file mode 100644 index 4997c4f25f311b012d216c51cdf5294796ed29bf..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:737377e404292d59a7df79c3811678cf82f2b10c112c7f9b861844e9bc32cf9c -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt deleted file mode 100644 index bbc39b0f7189bdd8d1f66035e322e253fedd46b9..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b55cd4040cab07fea0d426ac76086a52998101b45c8ca392b78eeb347d222de0 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt deleted file mode 100644 index 3cfcfeda039838feb80cb89d007538004bc357ef..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:cdcb6a73be0050be09e4bf8b3cd299d9d7ca79804a1d91e61691f0667cd47011 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt deleted file mode 100644 index 5193720d07a1d2745754edbd85744ecb3570c6d8..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7ef16527255ae855934b52a374d99fad5c83c559ba8f1f8f051ccbc747507946 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt deleted file mode 100644 index 02f71ae68e2f757ca0ab5b360d4d838607eec897..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1b88859329c941f2b82cb8ce4817d082ff61d35e2cb68983ef02716277990a20 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt deleted file mode 100644 index b1af5da7c5eff63bddab0d5135641a7f8083019c..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1628d2e0d3addb02371918fa069e71b16cc1d8b84664dcea99d97e27bf290b51 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt deleted file mode 100644 index 4359722588998f71baf0133a24e3792a8984ed4d..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3288fedfe468b05e9a27a13cfa6583984236549dfaeda4f025d155c6a93602b3 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt deleted file mode 100644 index cfb6b82b6243c09241dbd00223802324dcd54490..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:65b36021436e4a7752b67611b633e4778a399a33d7d1bcb10f35cdf411f204d7 -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt deleted file mode 100644 index 0c5712abd103d57ac8c7f306d8b5367fffe1aa21..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7fd379f2c76cc2dc40c03e2445cef616ac6022efd56078da85dda560f63f4cc3 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt deleted file mode 100644 index 531208ff2af03acca0be76e3f37cfd835e50bb71..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:221aa370475aec63c56418be36cebbdc6e2b11e9bc13aa5605e9d880afffe374 -size 102174189 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt deleted file mode 100644 index 59a08baaa0cb58b4e5b5d9c0cd036afea1669266..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:59233492d3c83205dfaef9923377309a5e9cb0cbebb38ed9462c57f5ccd680e0 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt deleted file mode 100644 index afb078780193c5703fe106dd7d7b4b9bbf29c2e7..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6d85d8a95a521c8b061c6fad96b934b6eafcfdedee8f261274c6df1e8e6340a6 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt deleted file mode 100644 index be2a59ebc4b065451ca8af9c91e417391dbb663a..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:90d579f4c42e1475c3203f285610bd6f5c822b89fa52749261da870c06aad747 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt deleted file mode 100644 index 8e735181808f405c30034c7ce7ebad2cdfdd4b5c..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:41bd376bebe1b75373c3192f86dd49a862e049cc10b02f194f3c456cfb691937 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt deleted file mode 100644 index f3320ec6f1f5ed87c8e2ee1030e8b33d9a6b0dbd..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d9131462a28f2e58a1739ad5d21b58ba227ffbf292b0edf2c0443ba96a374a99 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt deleted file mode 100644 index d935d7837cdaa03a529e1afff69f3f5689f5e6ba..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e1220e0d38fa67be82b865f2dec7dd11bc2699957e89dbb40a949578fbed1cf6 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt deleted file mode 100644 index 58edbe4186699fc13817025e15e6a4efd2bd8839..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7eec228ff48b40161fcbec64a4cadff1116747728da2330eb59f70724a9a3282 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt deleted file mode 100644 index 77cf29bfdfa9d2a1fdffd469300fa0c707259bab..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4ac14891430dbaba79dde73976f1a1f0583730cee4cc2b39cfb9582c7cf95f4e -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt deleted file mode 100644 index 524db46ba65d9947da33f9ac0380cc6ae9fe0a6c..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9c622a0d3bbc86d17ddf3165935b34b6dd7588b5646c13effc38f1bcc3d5b260 -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt deleted file mode 100644 index c1ad7611e495de13ea67854c72da72998e4a08a1..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c1e1ebe5c2c89c64cea24a69f232d8361d7b3a7a165bce28e751319d77488da3 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt deleted file mode 100644 index 64823b407c38559814c9ce7e47f40e0d3bfe4671..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3be56b1725755e2460caac77da6aec7f136482f44903b54cab74080ac761f9e3 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt deleted file mode 100644 index c4059199770b39f0c0a1c275925fd0a6dc246a98..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:125d99c194b7bf50640de485ba983431cfce9c9c13d91fb73af9c7136ecec21d -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt deleted file mode 100644 index aee324ab383b3d6b5932db5f6fdc26d469ca5276..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:02321ef48ba2ffe5d27345a2322b38998fafa75641c062e4e77c8bcea68368df -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt deleted file mode 100644 index 78d0790b8675133c61d1cc56dabe8e27c95e0ff5..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bf8a58885da06b80c2beeb7e46f7154315eda833f0bdbddf5d0f7f962b9c4f49 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt deleted file mode 100644 index 00e54cc0fd48813cce5b95214920531ec0f2368f..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4c320eb9166625d644ff642df4ecd88ae20570a65a55970ddbd2bf90f86cfa6a -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt deleted file mode 100644 index 122b1ccf04a4b55ccc2b1383bc207d59974800b1..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e59da7973f335a864d699defcfb5187befa553fa004b3589038f29f4a60bb9e6 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt deleted file mode 100644 index 61d6f8090d70cd9e7a8f79fe413790773c363a33..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7261e232175dbf3eedeec6c33eb212d28cee1a16a7d8ee7c122e297893877fe8 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt deleted file mode 100644 index 4475a352db475f99eb5422c73a0bfd1f7960d31b..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f37884cd8a61f623ea50f68194fb73f3fd1c12471d3c82fac235a9e21698fe54 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt deleted file mode 100644 index 6ccc283bfd27fc95e37ef7c56e6a33c3921fc6af..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e9ea910292d70551aa3832b9782937f59e90bb6b868df6b81c6e6564a5b6b4ca -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt deleted file mode 100644 index b9a39fde2d4825e5cc3ee8151e3f86dc325d6744..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6524d0cc4c4fdec0b147ea24e91eae9267ec3d93746bb297b725481317d03756 -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt deleted file mode 100644 index d58dd5fbe6a6f815bcca98db417e0a6ab5bb8573..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c20427c6f6fce3ee389cca34ed316f1fc0176ece849c639ddb92c6efc35cd730 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt deleted file mode 100644 index 6853ea3092b5ce261ab880e8536fc36518bb4d62..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e12e46b8566933b387300aaea50ca233b9a5f897ed2c2042104d9c5bcb1b1578 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt deleted file mode 100644 index f872f3c8aac1147021ca7234671e264928be2b33..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4e36c16f53707f18d23baf3d4fb42f3ede670a1a4c426caeb5c918de6149f0b8 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt deleted file mode 100644 index ef389a26ebd3e3f61650c23060050132da42e64d..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e56bedda086a061331b95d817e73396f2cdbc0d1e1a09ca321fd7361bf2d236e -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt deleted file mode 100644 index f83a6a9b6fa709b533a528d6b9a736d33a84ee96..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0f18bb8dc7c3a7c56319c4176c4e815bd017a4418629e2f9f9a2388d489d978e -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt deleted file mode 100644 index e32ad129dc4a7cadff67dbf48afccb323323c350..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3709b788f158a33c92c70864738c7de61ab811e656aa577559577f000e63bc38 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt deleted file mode 100644 index 604bcc7c3d88205622d485e5662d73b3a7d7fcb7..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:cdc5ce9cd57be8c8a8932c174e93426ee89d7098584c35b8b8e166aa971b32a0 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt deleted file mode 100644 index 678042310551383ee2fec7b18169e9e7a74d968e..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1df0d0d909b6be8af47db71ae7be92d7cb2e4b1aaee00d2545b470fb16ede879 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt deleted file mode 100644 index f1d4c8b51def25fa08055c966a7a3ac8de71106a..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9ab5cdf126eb938e6a27dd61e3c50f4d4b5767ada1cedf1764ebf557f492de1a -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt deleted file mode 100644 index 494fe08f679f2baf77bb0901cde94d3c1053eca7..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2597d3dea3e0466e7a302b632722dc985fb1e2b9eab7fbf9a36d7b13085381ac -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt deleted file mode 100644 index 7ce6e3f8ab6226b65f2aa12a91482dfb2f38c313..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4fa86645a0f1e623e0375b1e00c0858146e23236b1d1ab7f37d73a0e69d655e7 -size 102174114 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt deleted file mode 100644 index deb3e4476d237240d53eede76c4cc3fa1c27697b..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a1f8406cd6634b9dced8cde1804aa24fd50fbf91c9a965f3e44a449abd42ed72 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt deleted file mode 100644 index 45f4252c11a3a08ae18e3324238c718e5bb89ce9..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c868e3497214c6047096b898fd445fe7e816d64171a5e2cb55d0bbc7f75fdf1e -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt deleted file mode 100644 index 3060453e8c8f2f91d1925fa0ac9a606bfd9dc1f1..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:561eefd890a0c4741d0b24b126651f4d31db1f4e516e4fa3ebb5b103a0b3e171 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt deleted file mode 100644 index 4fb098b1434b6b2a64e3ac39d0f92b10f2bcf0af..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:da9ceff52ddd76d7333e459df0e912cf22f24dd67a1927c6c479b05793519b00 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt deleted file mode 100644 index 6ee91acc71803bd861fa76d2256664c4b5fc2681..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:08cd6c6e758228d9358c24a911d8b3e70c33f40c3661ca51faf968dc9e7200f5 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt deleted file mode 100644 index 00df95cc48371a92c1cecfbf5604d5ca134ce4e5..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e7e4e2c34f73d6d0bc0592c41b9dd2a6305f9e06fbccc2fabed34add47fa0fdc -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt deleted file mode 100644 index 440ca9d8dca185d2bbe51419c95e326829ffe08e..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:befc7f44b7fcc56924d9d8183428eb11f51324920304af89b3492ec2109a9cbd -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt deleted file mode 100644 index 9f7f5df692a901f9e6ea12bc70aca2ea95e25679..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:75c1b704959b67b4ab05aa7f45d3425acbf2e9a01d773c92c3a721de973b6b72 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt deleted file mode 100644 index ebb6b98c330d8390912924b412d13b3dbd62dc83..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:31defe5c2b515ee619cf01439efab1d02122bd856115a17a75af9c67f0d17dbb -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt deleted file mode 100644 index 64cf88b378d49abebf3c32d221772df3496421a8..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:aabbc8f3b6e308c73bdd2498d066153174d7c595d424c12ec4963dd73ef177db -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt deleted file mode 100644 index 585485b3d903f2202a09f58219baa052110f2c69..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d55c3796d1eb6f80600622c4f79ff170257d9ce53f362bd7b579d4b4a48df3bf -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt deleted file mode 100644 index 67f14fe4c83807e0e7ee93162093d6f51f64c11a..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8a0e8613fc36491553dda0ec8323b2fc04fe9251cb6c974828a593f332c9b8f9 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt deleted file mode 100644 index d4b39e49ff636d40665c6b2f3d3fc9e4aa9b0286..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fc1fcf0176f8b8ab73f0b502cbb1dd82621a311b11f7e9f4470d0308ebcaa824 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt deleted file mode 100644 index 29ea56b90cdf52b19f1c8a37b36cbc7cc9029fd9..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2ca1b70d37ab68befd00845f60d36616a3e3605cfc27d484c7db2e90ce866c47 -size 102174189 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt deleted file mode 100644 index e9d10ac539804a5d4409ed800d83a091ae3a4fd1..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0574f57c1a5951e1a3560f992bf848d35c7d8d5da6f15dec111634c90d04f917 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt deleted file mode 100644 index f8ef692f99dfc60219397b8ae9d6cfac90de58b2..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:25066d0438581d0bf03bf80b5f05ef6ff3a70842d6128e86b3eee1eafe00b95e -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt deleted file mode 100644 index c989bf7fd620844ea2e0ebe6ad3c231e578366fa..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5048254012f5547faa2c11840cd10195c76988514891c6cca9f40d6f3581f240 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt deleted file mode 100644 index 3edcd13c227801a4ea9a4f4c371d46299e9c6acc..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5d97c86096df03cb8a13ce9e1b035cf54c4bfce45899ececeddd33109f1de980 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt deleted file mode 100644 index 235424d77f8e56a973ee0bcbad46e80a288af96a..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5a21816f6f68ca56bc3716e3b68e0c674b8cb4fbcd6eeada493caa8982d35888 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt deleted file mode 100644 index 354858a552cb1c0f195d59970ff1382ba56ebb15..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d4c5c7ebf0e5da8bd70830c53340075373eab91edbd155eeaff94b0c7d9a686c -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt deleted file mode 100644 index 7fc456fe2f28ec03eca04e03c76088fe71d24cdc..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a3fe99f7eacc7c0f2e8a0f190100e60bc8417708545fe461b5e31a82bf238e36 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt deleted file mode 100644 index 4c536794ea0ab2f77b455ff41891232137827c73..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2f532863d647e0d413fe87252f64a3027169aaed91578bf14859d98643b01c2f -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt deleted file mode 100644 index d6481dd0661c86fbd279eaa4f8ce120ae76fef71..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4499efb32297ea7ec6bf5bcdc6fccc4cf91f7d527787d12497ab1bf1e50765ed -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt deleted file mode 100644 index fc901c3ccd0a8034630d72d28997fc239bbe5c76..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4fbb8c9bbd143f2e6c667298bbe63334ea731e92c1c2dd0342b2788bd8fb6b14 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt deleted file mode 100644 index 15f060fc7fcc53e8dd383f3d3531f3b866d57aaf..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4d9fbf133bee32e02d4f7c9cdae387d9ca005de71264e3f6aaa018233d18901e -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt deleted file mode 100644 index a2460942ecc38a759de9a9dd002d27ab19a6fdeb..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f9ef7dbe1e7c018a0c72eb8d796bb4ee6b41b222f9ce46afeec927d905aa02a2 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt deleted file mode 100644 index 6664058882f49e509fca2bf7d4cc659f40ad71c6..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1a615784672a7f23358fc55a7e46b0c7dfd1e7ebd9521990338f3af491eeacf2 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt deleted file mode 100644 index a034b7b8649db1eec8455854e8f2c484efb6ae73..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ecbb888a6207e34994f6d86f0d88460883111d2d5a11e429f23448b4b1960402 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt deleted file mode 100644 index 3b39e652f1c88835ed1263d35189574d6cab65c2..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:477029271bacdda0dad191ef1f26ce46c8747aaa82f0f3bf0fceb8562e979f19 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt deleted file mode 100644 index dae138db4a299be73a2c8b08e74b2117ce234e1e..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6e95c04cc8240b367ba86c75f3d3ca141428aec74bd90207dcc83a3a7eea3cbd -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt deleted file mode 100644 index 806dc2c2ea340310f06d13f9c8947eff4762f93e..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:abe57923c0f8851b69c80799584451520b6dc0313b29f0cc64d7f662120a3455 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt deleted file mode 100644 index e7fc32f949446114e45a673eb0a142f5999c93d7..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f8904fdffd8a48ddc737c6af40c88521e37cde9cbc0f6002b6642a977dbf4063 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt deleted file mode 100644 index 4fcac6dcb9aa8c15972f1be2983e48f8372881fc..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:72e9e320c4c3def2d7a346f3fdedb8016a9152c0c13544428e85be7ab3beaf8a -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt deleted file mode 100644 index fd5010846256520a9d3645c6467469fee90d03ee..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:45dc12c1822db6a1814d8e7144ed94112b088ca5a15953c28d77c3994b824fd3 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt deleted file mode 100644 index e0980216218d7ee694f0a4f15024afe241946dd1..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fd2928496dff2d83843f641bd05d237b5a35055f062de88aeb801aa697614c3b -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt deleted file mode 100644 index b09b738b679b2823de1ee416426dc0d77ad38fea..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7bc48e154018db4ca6bc4d064cbdd9158338b93232e50299a9ed480592009209 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt deleted file mode 100644 index a4294219d741189a77235b8f3f99ad79c59d493b..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0eea92292c719a8cb42156da094218fd1e8766a334df5678ed3a61c59e3d3ca1 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt deleted file mode 100644 index 49d3034fe74eda1a629c366d3fcfd3db57caa482..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f0979cde69c4a5a8b06cf305b67b04e8fc3047fdf3202672ae86eb8344afedaf -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt deleted file mode 100644 index eab741a29ce42eadb415014487d9cd02bd012b98..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8e9f8bffe32f923f3563c60b2b4af86c0e64548c4275eb873ee364927cdb2caf -size 102174189 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt deleted file mode 100644 index 25fd4ab738bf9da49d8438491fe0e4ef103c3a96..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:68439d169a2396f4863ae9c4248eaf05da886e117c06db7a2466ccb3f18479b6 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt deleted file mode 100644 index 4969aa1210cf037abd3f500f10e08ae9fee9c6d2..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ab261cc6ad987e2cd26379cc8bfac988c497b3147689a48f6154ca0a8085b3aa -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt deleted file mode 100644 index 95ae3304265c01e327d8551593a17b3f72f91246..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b9cb4c93374f3952fcb293c2488a7f0ec1166f0fcaa7d26472cb7843a6a35175 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt deleted file mode 100644 index df3d3a1a0e34e2d92accd101801e040d9fb51265..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:89b28026b07e3d3048c1e6875bd683a345f0bab3400dac225f4e57ffbcdcfd8c -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt deleted file mode 100644 index 1eef19c2dffb59770a604343969b63234ccaf0ee..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9148e67081298de1a5981c6656381875e814c1597c8c628c807cdcd9203c6bdf -size 102174114 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt deleted file mode 100644 index 5f513eab5895a5721c55da2a618aabdd2229649f..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a8586a4dd22c03e43c12670578932a9cb40f07c0a523d10c87467e2633fd3716 -size 102174039 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt deleted file mode 100644 index b36a05dcf61e1a0a1f11faed3b86e2e5625ecc1e..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fdad0179597fb079be3c79f4307085663aa49f6a7b4ae1864d52e4b8ba1e9727 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt deleted file mode 100644 index a01d67728a538ac94a7eb17e6309c6e29cba1bc4..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:987f2b2991c23999c8a87df4d9f8f37a27f03c10ddc00bcc5c9b85494dfcff0e -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt deleted file mode 100644 index 0113d15e661214ecbdaf59583e53fe63cb429fff..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:280cc142011be0d8b445298526cad9b5a51b347cac6b35bceba1c43e3cda4767 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt deleted file mode 100644 index 8fc73e516283543551aca83db9f1b1fad5dd0149..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:dc08a99cb24e7cbb4d0d88d3f784aa56eb0ba1e2da18c19a32d91db8a27c6956 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt deleted file mode 100644 index ceb1113afc74f29aa2b6ccd8e0fd5c252ccc6363..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d17fc57e88bebf997b8afc932df7955b8e6ee317fb8749d91dd3e7ab9219a75c -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt deleted file mode 100644 index d458032ff0c0b60f2fb43c988960cbfceb89b388..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7ce5b13417b253cada971d757d5e685a64537657942cf16f74fa4e017dfe1e97 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt deleted file mode 100644 index aba3a0551b19e15c7b761c9d97a65331127a1464..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1829fee9e91e12bd96477f22371c8753295b5afdf806d20476f21b24bd859438 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt deleted file mode 100644 index 58bc6d614f0ce3a597314d169e496cd1bc2b9c7b..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:736e2a78f862310430f05767c4a77b1f998d1714965491df39e396c0feb8ca38 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt deleted file mode 100644 index 0b229c43a25d07a4b1cdb1c257568570d50fb8a6..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3d115a28d759138f1972e9ff76c4b8e5c3a02855dccee49bea96b2681c234669 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt deleted file mode 100644 index 181e02fea143d81328886a8c8afac5aa7b0f48ba..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8841b1c08099307d396378495bcf4174e6778b77781092966b0c6cf34801f72f -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt deleted file mode 100644 index fd5963677b7e8814602b5532a199014fb8a0f45d..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:605af5e677bf792961ad890f087c00d59313f1e7ea5a636884e00086d294d8d7 -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt deleted file mode 100644 index 30a66c0727c1da779487ba6ae9c7c1cfc7860d1c..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:dbbfed5c777baf786500d06f9c63481594a3b2da87790b8bdedddda72170d8ae -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt deleted file mode 100644 index af92b646fe6f3dd4d0853019d83d46dfaeef213a..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5bce7024bfb7e834fef12358f84c4872738bf5825994f1881529ee48d8d330ac -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt deleted file mode 100644 index b9d35c7a521377b1fd37e41a1243581114d7fd4d..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bb11b148fe7281fbf16ead3beda70ee4d54bacb4eac50b8712f554dd4db7579a -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt deleted file mode 100644 index f0119258eadfd5dff78389a36d467e946dff335b..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8080fdfc3ef4d017f518f44c70a7c23b32bdab2547794e06551fd1989b1e96f8 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt deleted file mode 100644 index e8242e2e2259aab13709ff1e59782ad6f7adc7f4..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:322130e46a583ef8fccd15d1366862e2a817e5b1b161bf9ced06f066a5b16108 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt deleted file mode 100644 index d3ace79794c6b2e2ad9f7de17656c36fd6913503..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:889278aa1b70878e8dbeb8e7706dbd9e5ea31f95c213fd2e3fbe4f5eda53fb0e -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt deleted file mode 100644 index 29d7fed2ec6b0dd401b411a288f8406c4ba9c35d..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4c8503e924a38b30fa1afc0435a38ac037f4d518de2968c0b57868da654cad07 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt deleted file mode 100644 index c8de2cbf9c8ff03b375916bde4067419fb6bb75b..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3ca98e595cb33e0bae9888bb32b5aa40032d0d3c51be65381a97c359bea34f46 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt deleted file mode 100644 index 5964d1ad0e846212d07f1845fa462f8d30e9d92c..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:63638c55e1b55130dae9c7427c43156b53ca96ea5d056d9256b08c1e6ee6582e -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt deleted file mode 100644 index 9b096da58bf7cc0bf8990b039af45fd19e3c90ab..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:acb45da735b8f185a7328088b072231ff188dc9c5ab115783863dffbf29e03f1 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt deleted file mode 100644 index 2df783214abffe50f74cce1b88c5a559caf3f331..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:da06ec0447d807da49918e61151f5fbdbde660d72b7d2f5d8c6d9e366523ea8f -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt deleted file mode 100644 index 4ac4006061901082aec065bee607ff6e21c702b0..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:61437c58f354cdb090e8b7a97c2c519ab484e86c525fb055e9aafa4e2fd346da -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt deleted file mode 100644 index 1cb682233d1a31107db8b45a74ff0d0eeabc6528..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1921ab535b9e219bd14de981354f0e0057614919f4605f47d4625f9f08b3f49a -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt deleted file mode 100644 index 2e6ece3f3ae100ec8c095d691210250ad08303fa..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0097ab9f87a2b38cd108a2cc4ff6430dcd8b0bb481005b39c66d113683026b0c -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt deleted file mode 100644 index e3d14e9862bbf3cdbe8831080211a09ac47f5e63..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:64b5a270b5a661861ff1d562d0a4814c69aea8d1a87f41e97eae36f8ed781943 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt deleted file mode 100644 index 8fb8fdf03c421c65dcbb21a7f0e56bef01baf3fd..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8eed3479c8a6affacfa20d5a663b6dd2fcc2173b4be97590a7bc2c0f8f96c2d7 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt deleted file mode 100644 index fdb7a4494deeb31ecf72f120fee384bdc30448b2..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fe885d5ba4a92d7d310dee1c326b46e98e5129671ae3ae94a1a6c7aedd172554 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt deleted file mode 100644 index 12a1a1c06d33feb322bbb6c8f916b57a92f5645a..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e38cdded07c365e24cb4317fcd56f19454a78e5ac5a2618af49cc64f64b68b9b -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt deleted file mode 100644 index 6851e5bf0c8964f3c169a6b5f7a48e699af53dcf..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9008a401a898e5f82a705a41758fdddce2aa32d3198813bbdcb8fddbcdd973d3 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt deleted file mode 100644 index 12d2723fd2335114d760ce5bf78c1012f920ab94..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:67c7c69cc98d20ae664ea4180bd5a1e7c12e53d0ddd88be926c57c1488bffeb7 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt deleted file mode 100644 index 050e1f684d3ebf180634391bff53c1e9e9bc912a..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:50f2b8595493a54bb838b52ef8c303fc37435b49d68fba5413a6a63d6671aa2a -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt deleted file mode 100644 index dab8a6324fbd4da1dbecad1b80f926ca484c2a15..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1d9b04ac23a2d8a04fbabddd5112e20f1c3f5ed94d18443bf9a9803cdbc15047 -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt deleted file mode 100644 index 0c545bae221be642cea04f741e8510a503e7d85a..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a2192fd05ed8d9f0805bac0af5dd78267646f5356ae926526738e394eed81216 -size 102174189 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt deleted file mode 100644 index e3e6b9f008bace655ab192a28859371a4fa1af01..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c9cd98a66845a33f74a91b08414dbc0afa8cca7623aebb0188ebbbcbefd32062 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt deleted file mode 100644 index c4bc48d2ce99cfb5dfd82cef26b6e9b3b5da2f89..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ade0562fb05809cf99362988de635b240266a501f349576f7e08e7327ffd634c -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt deleted file mode 100644 index c4fb519dfa49166f1bbb7e8ab9c49de1c60c875e..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8521d8cd85e4e229940154147678b67d3da1d87f1a6604a68da7de4d4c59731f -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt deleted file mode 100644 index c2a1ea4755e51b49090c93590c40a879ace20748..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:efecc2daa712aeda04136762921bb1804a62f63f8a2e5a49c739c56d0b3881fb -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt deleted file mode 100644 index 263f37d34372a78a38931e4f40abcbb2cc660f34..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:49bcb04939f204065b2a09eda8787699e73a717937135e55c2899dd9ece907e7 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt deleted file mode 100644 index 5dccfb3f00a7d2c91f7e80f76df07be70771fdaa..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3c57c9b5126484c533e79f58b0c5d1463dce124cb9ce8f9e8cf87189276ec722 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt deleted file mode 100644 index 508f6f43db030616d68fbe7606352db0ef1da504..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c23f2e8fc230aace351a035b22e0fc807dec3b915a76024131b3c8ef11eba05b -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt deleted file mode 100644 index 3f019713c4c98197f3a2298b8c7d7d745097e4df..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5815df21f8b073efcddc30d935402598700c7ed13680e0b716150257205702e6 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt deleted file mode 100644 index e2c9340817b979fa6a45c62cc5e17b0f932d4ee8..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e2fbc1883b28e0a47e29c2fecb2ddf0fbd2be528fcc9c54478adc74362fe1d0d -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt deleted file mode 100644 index be9965e00d8c49313ef2b9987024c95cb0030984..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4ec0985b67ada8e0f36cc508eeca9d726370f9afff64459f786a5aa4d9caf83f -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt deleted file mode 100644 index 842e553935a80268c1bd96161576ea04f62333ca..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2c835dc9cfa772caee995c1ca0513492116c938df8aeff3a33a1836cd8d3c761 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt deleted file mode 100644 index 7ccd26b2a0ff7dba53178864efce3cd02edd9696..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:70a1b12f796dd8f258e6bfef3ee927375f413e96cd645eaa87129a81df3f346a -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt deleted file mode 100644 index b664e942ca95117d12d65680652cda726608885e..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5319c39e968d0ae9b3b4841cbb47030da658e717859286d02075a7252242fb6d -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt deleted file mode 100644 index d10b55ee045f60d27539366d604820cf69c80725..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:988cba39f014f625115438a8a2a5b3d80fc7802689353a42dccb2b12e413c7f3 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt deleted file mode 100644 index 83b75281edb073401f6d1fc8f0604d9bfd847f12..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:030e66668e2081a41c80fb82ae1d6b55b8cfb5a2629e84d6ce02a876c9c843b5 -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt deleted file mode 100644 index fa84ba665a31c824a2cdbb6b744e3e4d2eb8e5ca..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:95369b424d08613d6e4136e96f12acca1a3b06c2efc3e30d51cff28e5238e5e6 -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt deleted file mode 100644 index 5652d6d8e5006414c8c8662ddfa2d67d1c2964ce..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8ef969b5cd4f0bc156b331554d3f1a03c34737bcdd8d5dc9e29378ae5497d01e -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt deleted file mode 100644 index d6b6b67392bf48a477230b9f227dfecf8c53a2f7..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:64f0c978b62ce92dc44bf599f70e9c8960d2a06fdc019b1176fa3ac3360706ee -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt deleted file mode 100644 index 958ceb4ec0ce283bd78c831d5312ee406afe72e7..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:da2e1071ef8e5dc105d84a365de37838e413bec527de9ab7a8e68efb7aa0c2ab -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt deleted file mode 100644 index 6bd52d2326054ddab5d08be389f6b1fa98495463..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fd856c7b57a94f84306499c9414b17277c0ead46dcb44433921bd8502b57deaf -size 102174189 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt deleted file mode 100644 index 96ad44d8ffa6aef01f9270b391021932c1f5a540..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:49a1a8a4173c083fda65c8ff0a45aa722f0040f5dea8efa305d923a3d879a256 -size 102174114 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt deleted file mode 100644 index 24ff13e6b6a98725b6b6a0a2fa20f9613de0c2b2..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:30cfa8624733194b4026c589be45246d81b3f690a1fb6b5b1cf62c55efbe868f -size 102174125 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt deleted file mode 100644 index 00a79aa690135ab284168a57c803cb001aeb400c..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b2ca265c6431efc8a57bbbdd0d6b3124a4ccec6427b076f7dbcf49d3791d47e6 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt deleted file mode 100644 index bf899815ee4ad49ccf21bcb9b07a8a6a347e14cd..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1255cb0358935e5a8c751b84cdf4d2d7fd75a97b281f458d930e586393d85726 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt deleted file mode 100644 index 7a7924f65546f3bdadcd296afa7244590479584f..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:31aa0ac6f89da4e3d0ee85071874256cce0393680b259594d6e4ce51176d7a7d -size 102174061 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt deleted file mode 100644 index 1e93fbc8e2a8a80263aaed9cb4854217957d1142..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0ae4639a3f0f437114a2a6996aae6aa257dbe2b82987bb78a127dbd5a1d97705 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt deleted file mode 100644 index f37d1eb16a4c98fe4c8c5de2ae7cfd04b83cdea3..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f558d74f713b1975b7dca4cdbcd69975471d61c8ec692fa5dfa762d43e7fd691 -size 102173997 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt deleted file mode 100644 index 61c85840922e7491b317f00f23c4051717baeb22..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:befb5b2632d3ac002c56d5e48f0d18326cc4ec9a0dbf4481403cf3ec3ce2ea42 -size 102174114 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt deleted file mode 100644 index 30c684b073b7e85a76df30d2d9c0ed1dfea49109..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d2376b2ebb321bfb30ebfaa68730e3677bcadc3722ed3080f2a5bcfe5b1ff6fa -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt deleted file mode 100644 index 08bc2158bb8dfba967fa8d29ae722b92ebe83276..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0820921b0cd92ffd60cf83c0fcc561f111c9201cc89d4b01d0346c6785db0ded -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt deleted file mode 100644 index fb8db6506ed9e5b6e464be93092733a3cb456e31..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d32f8e9c542491be781e3fb206c41cab3cc974f6d6286c888fc51169fbbcb153 -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt deleted file mode 100644 index c2fd9f4183e5c1f1bb3f175dc435a84dd1fdcc7f..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:41525a0fbabe8d8dbec76c7f97dc087079780ddc87eaeeb472df8eedd15be1eb -size 102174114 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt deleted file mode 100644 index 51bb540b198c960a3110a92356f7a32dcece3f0e..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9e44bd1c3a81ade953d973fd87fc4dc94d9d1e58a5231046b4a4159fcca02735 -size 102173975 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt deleted file mode 100644 index 6caf2229bd3e11a0ca5258f5436d7ed38388fc71..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5218357a4ad3125b4dd1e0056abd13629cb90fb84798772e9925c12466797e40 -size 102174242 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt deleted file mode 100644 index c81e204feac473c1154fa695109e32d29043957b..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bc4aae4e928b7ed37b5e875b06697ced2de1e397eb79b9814c9b5548f05a6b2f -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt deleted file mode 100644 index 83d8c953be3786b4e160fa058c5ebf97bf8c0985..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:779d832bedc0a2bb60caa447c9e8487660a7e334074234c55de2139249ce684c -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt deleted file mode 100644 index 1a4c607106d712b2c432e01b7965dd4695e17655..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c29e82704e877ace5654d5bbcc74d1ff4db71c527348137e9a535bcbde2861e4 -size 102174114 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt deleted file mode 100644 index 7798073bdab3bce263cb466a9d2cbeb815038c15..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:adf50024e9b4ace6d2b880c0e96e31a232c7684afc624ffa173f23f757845dff -size 102174114 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt deleted file mode 100644 index df4e23c25582abb3e2e03be1c372471bc2c51b3c..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0608e9e7374a5e8422d38ceaf3f8ffd5b390ebee583b3a654e4ca5a33e16b968 -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt deleted file mode 100644 index d8009a4a8ae9af27957e4cc3000eff5e33c260ce..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d09b1cf76d2f9778f4e6fcc69b71bd0f3761b8fb3ffe5d64489b974d78797b30 -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt deleted file mode 100644 index 5f2303324cb98697a7fe5d09845a384640725bd2..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c933e86981e562d68c19b700acc70f478596b1db49d51f11b2fd17de21638fc5 -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt deleted file mode 100644 index 4fe2c4862f5fadcb8e59c10b72e796f9391f50a8..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f045f60315e5fea89dc202d418eaa6b0117e7ce0bd14d2cd09374d8b1e0fd450 -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt deleted file mode 100644 index d3cf6e9715b628bdc301bca104c4e14c637e6a5a..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:33bfaa2cf77ae35eea54ebd681698a6db55fbecb136813cbf7b253224e74d67e -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt deleted file mode 100644 index a64fa37e6bce6487e799c20a2106891409b58877..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9be9fcbc4d7f7fbcaf52fefe85f92f3f7ff59eac021300c96bc0240830eedaaa -size 102174039 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt deleted file mode 100644 index fa09005888dc2c8e017ea08abc510f89d159c5ad..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e0d74f2d531c3bcd452f252dd259d233bf8cd3084cb135216475d78c13b18875 -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt deleted file mode 100644 index 650fed241284824b01037cbb7b8648922a90edb7..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:39b6929aad1fbaed9d7be6ffce4601bcce80df89a508900d75c2d11b97c5afa0 -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt deleted file mode 100644 index 5472883b0a6d1bc5a6878ca0ea4add38abef38ba..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:423bb2ca7f48cd4a5695f40e13ade51db73f3a039cbb1a739425db7516aa7a9b -size 102174114 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt deleted file mode 100644 index 64a79830a659486c8219a7f42c05c232a1a2f775..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3d0ccc27276534df1b8592fb3d989d7cce1d3b1c054a22068fd31a4f742f8002 -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt deleted file mode 100644 index 40b6cd7fc4efb97f2b83d4497e6f794e7f46130c..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:70e808bc1db3733ca60a0f4e759cee0167e85432c74fe1b05d3d68a12499d2f7 -size 102174114 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt deleted file mode 100644 index 3384b8d916be6d2ed2f38b19da60c577b7b8e5b6..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:aba5d380c2d2bcfed5e9492513d08c1269029d892aa21f825ffa9ddc37e25f9b -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt deleted file mode 100644 index bc2e184b9fc64533ee269f2615f576cbe6638c71..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:79a2a46714033cfa3cde6fbde2cc84604aa7bb5587141f96aa621937a31817f2 -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt deleted file mode 100644 index f09b207a89924a70570d2c1c0fc8794942ad1951..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9bcec69902ac16c673de1559bb8d7a58c68ad41376ac84362a32c0401b0ef950 -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt deleted file mode 100644 index 6cb8addd760ad2c1876f863f11efbfc64f6a59d0..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c120b2758254ca2ac5cc86311cf0ffd56e2aae096db540bb3c8f8b103135cb38 -size 102174178 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt deleted file mode 100644 index f1e1a41d41f3a0c040cf3d56b0f38a2404b0ca0b..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:970031b88f2bd351616331a493dfc5d5aaf7dab1777aae19363a620d474810dc -size 102174114 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt deleted file mode 100644 index 82999b0221fc14fd256b9dc505d4372f16d22bbd..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a69d561a21fc83fef80fd48a5e07454b65b2c2c853eb6b7c52dc4d7d37fa164a -size 102174039 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt deleted file mode 100644 index 8e0f575294139df1a2a95f831c8be70f086dc9a5..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f27c374e769007faeea74d7d158b2071275baf5980e0ed37d4235fd19196ff31 -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt deleted file mode 100644 index 32b7973bff1bd0c5cd34ce582b5f00492e8c97d3..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6ce196dc33eb41831e8c811048377387b6001b99c9150ea64e2ee0e48e0f6ebd -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt deleted file mode 100644 index 5a8db92555fc3010572637036c0d6bb8d142950c..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d91740fd07a9a048fa31c54065f7c886746e36cdebb0b99188abef46c077059a -size 102174114 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt deleted file mode 100644 index ae70bf343e1bd6822f63fb675005177fe84c5778..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f9c376f246b289612de5f591a2ed1846a3e5d0fe113a5b342da896d2e3827b58 -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt deleted file mode 100644 index a4238642730ca41a9bc297c9be0629cc1ce15fdf..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:102acc459ef3e640c7044455f7c696458ec6a6e726e6155a7b4cd75dd15cfafd -size 102174178 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt deleted file mode 100644 index 2830115a86d6289dca9e472fbe8ef52e726cd3c7..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:902487fb7eadbb5d32e4654a7558025cfd97d37c94d36d7a63e22400d0d55809 -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt deleted file mode 100644 index 620ba751e2615b84bbbe321d37e8b4430293fee2..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:47b57635620a183a0369b53c5fdc93185e0bb2671832f380549db46f8595ef7e -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt deleted file mode 100644 index 12b152086d4b8b677d9b2ca71b1aba112b319a8a..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:847d2445c07f3a511a6a6107f82840593a4daef5e67c4e13ce2a8213f2c5216d -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt deleted file mode 100644 index 43ea7d55e72bb2df259775a5a35062a61c995438..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d61d30bea7f3cc5edb2a0e38435b73dc1416e1052a938dc120d533cc9c5f00f4 -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt deleted file mode 100644 index 39689341e56fdcf6ea6c292a84043ddfb1f576a1..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:065c91937da496b48baff269ed1a226c226b2c87f78109b0d4d4f8bda3abd41f -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt deleted file mode 100644 index a1bb26ef557c71e5e179dee219f1f3550abed507..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:67a2727f7d03365f008e88e8caf7ef37379d903620e6546c17ebc2362b85d28d -size 102174039 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt deleted file mode 100644 index b7ed130f4effd1343fa31cdccd6d10f6b5402b23..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e93b9fbb6f44d499a81f38cc339990b63c949f0186657b0e40870db23204a119 -size 102174114 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt deleted file mode 100644 index be892c6d0d0460de09193613f846f3797b89876e..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2ec634489fd70f40a7de148238c95c385d0291812aec5ad49fae73c9c88d9cb7 -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt deleted file mode 100644 index 92daaecfc6eabb3f9c7f65d5eff233a2cd4e0365..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:301dd8219e1c03ce000690a51a9d0b2037b399c4d5e762d886b65552740d525d -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt deleted file mode 100644 index 70c9c1c1071c89024ea69c4846afef4a2a228e2c..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c5950b8cec565b39ba5ed1511bcb273915e2e9fef9f48a414cd0dd09885b6e05 -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt deleted file mode 100644 index 75949076e7089c73c1af5b0ecf21bf9b4633d3ee..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:95ce04964cbb010a8c8887cf539794ed2a152bd7362e69e83a371bf5d05dff5e -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt deleted file mode 100644 index 24feae9a6a79e54dc3230d1b087eb62f733bb42c..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:62326c64da36b6c35849d40b3d65898791851437572c0dcbd48d256f286a108c -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt deleted file mode 100644 index 7213a5f74dc8bb28d346389d4517c25418244686..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:dc52b583953ef23e1894b1e18200323ea1087e94908d2b8cb015e172e2b44b4e -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt deleted file mode 100644 index 25c2050913fc89ff03fc2af24a0a5aacd59ba0c7..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3742712930a040fce459dfab460d47e1ee2982c3a89793a77491dd92abf6d6f4 -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt deleted file mode 100644 index 25d4760e203a0bf750460ed9e8064ed2c011a026..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e524418c4a726c1a17d0012bb1b4288f78c99120e03ff517b80d55f7ceadbfa2 -size 102174114 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt deleted file mode 100644 index 3c48acbe401fc2344c9f80cd4ea58c99afc54828..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:307b12aaec07146613595f3eae3ce4f5cd78279a4fc8b976429f8b99f92d5387 -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt deleted file mode 100644 index 5025a906af6dc58b70bfacabae78644630d99335..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:807471aa2fb37b8781d53b2dd97a8708b5a57fa2331f6f160e1fbbd19b51d6cd -size 102174103 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt deleted file mode 100644 index 410e9bece628eff56f0d86143b3ee156738c4434..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0feb96870413691f30a74cc100f519b4ce27d5bb95ce63a71d9eaed6915ca4ae -size 102174178 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt deleted file mode 100644 index da8bc321b31f243268fc75abf748e4fb3b43ed94..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:122e7e9a2dea64f60ba44aa73f3f07dc41b9f473b40b8f2d726d566e8859466c -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt deleted file mode 100644 index 668d1d6d79a9af5a393ceb3334e3e176ad9edd89..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:560eb0fa116849026dabd7c92ec4a137ea557f77987a5ab38f91008a26bccbaf -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt deleted file mode 100644 index 77d7b55b16f55aa68cf157b30c9d318dab515ec0..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:995b045a3dc3ee42863808f62d1be969d62c2dfa3e5e71d4533ad7f9e24f87f7 -size 102174114 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt deleted file mode 100644 index 731360f94aacbf999e59b56577e1ad0fb5a65f21..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3fb072aeb2c6b33e15009a227a71dc1836969943608f83c3853e540a9e0ed9be -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt deleted file mode 100644 index 183d8e64d7a7c8407148a63cad780066332b41a4..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e815493bf6b0e504138b97e39baa18028338a1e8a48e69bfe56a2d721a5d600c -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt deleted file mode 100644 index 2bc577842aa7e56974a91799a40fc753725f98be..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f57e25fb9dd4bb7096f48b65a11ad86ca001b4efd054d5f75b0ba3494967a2ef -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt deleted file mode 100644 index 04eae37490be68e1be666c6f5475ac5167574ff5..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:276e192c21c0f7ae1d4fd28665c1f11030b3ae44267f29bebed3a2365004d49a -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt deleted file mode 100644 index d864d1723e1e0c6d3a91083012ebe3c84192751e..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2331480f544e3bbf7300939f3f4e2624f90dada10f744ad89b44c29b67497739 -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt deleted file mode 100644 index a538ea36846d05570a4696705ce64a5967bb3ca1..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6b9f0bb15d2c7225ae0ec6f6b50e67ddc9b3655208d8acc3914b6fe021c01b7e -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt deleted file mode 100644 index 2a10cf0f6e04d7be97987982ee21c9198834d322..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b6e46b6fbbed27d87d35a98e18e1fc5616ab7e77d83546db62544575f956e7ae -size 102173975 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt deleted file mode 100644 index 8bc7d63a88e5ed8054707f8121eeb6ce7f3217dc..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8b0bd426242125ff331a315b9c3869f07260f0b4ab7b31a9f9b796a3f2ad06cb -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt deleted file mode 100644 index 89c5c411bc9842d9ef208f568385cd41f6193c2e..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0562232e1fd704a41e9bbbbed5d60fe596baf91e7d0b5e161cbd30b58b6f02c0 -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt deleted file mode 100644 index c9e353503c8c61eaba1c5059eb4814f4efe0eb57..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f900c14ce2cbbc78cd3249ad7368c4f521669c972be98bb023579dd020a197ea -size 102174114 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt deleted file mode 100644 index 872731431f66b55a1d9e4fd19a06277ad8cce2ae..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9c18393a37e02753e483120a27f6df5f33c6f8b44188d8d5cfff490862a63519 -size 102174178 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt deleted file mode 100644 index ab6cf8cf56b997dd3c7de28ef6c16edb5f3a94d9..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7934210e1c7691499bf78534b9056603efd731233af9a202adecb3504a618bce -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt deleted file mode 100644 index 1c8e6cdf723652518899dd24e8774cd44f317132..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:68b60376a6b1496cef9b6af06f38e8a2bbd7dfde740c340e871987a2c92183fc -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt deleted file mode 100644 index bb1064c533dd1ca0fd9fe36a0858749d3a21d39c..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:33b6542bf0dfa0071bafd2215f1b7f29c04d41031729e7579a716c3d83694f88 -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt deleted file mode 100644 index d5879488f14b25435095e1e3b2f46b8c361023e3..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d6235be0f2e89cd415fcf23b0bfc493f5c3ce65417cf46e3757112204ad14aca -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt deleted file mode 100644 index 20e4cc7d7288b08352cdedc7660bc3e0ba1247b9..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:32c1e17262d4b5c0385d10785705c0c2bab60dc6c3bcdf15f4297013bb2bfe11 -size 102174178 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt deleted file mode 100644 index 39401417b31d011ef2734f1c0b7fb0934af2775a..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:edc423c4cf6765dac070e37144704f987e0394d9a2c88c87a91a19cb13516d8f -size 102174178 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt deleted file mode 100644 index b2761eb4d3e0f6efdd03b3b3abcc77b8b8c47f62..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e159bedfe574d3fd46e797c14d6ea6ab4c0492c068dd5851b58d041485a40ea5 -size 102173975 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt deleted file mode 100644 index a636d9f23dbaaa6a0a253a20ca3bc31cda4fcacc..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0380250ccc5ead0c107e14c763744f68d298c114a465a2d45cbc004fa00292c5 -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt deleted file mode 100644 index df7b64c39d95226d137b6c3bab7b8d4aed31c38f..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c4678bd0b51008b1c6778949a3a14a694e34f8e203c89e93706fee33b8f7101e -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt deleted file mode 100644 index b19469df19368aaa8d7d25d66d4ff6a047625083..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d9b788060ced1871243bf455c53d016f880f3ef5dad269e3c8cb1ac46b88aafd -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt deleted file mode 100644 index 90ebbe57176e0303936e1d07a82f73dc2978dc20..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:64ffb260890c408e3f17a4b4469db8a9010c4e1c9a7c80ad68a697f34dbe2eb0 -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt deleted file mode 100644 index af5bf0c7b379407a20e8bc7f2dbd6e6c8753bf46..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0b1828c98969f702d38ac3537890cca2bf7cf1a70ea82f6bae7954766745e1e2 -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt deleted file mode 100644 index b406a689827af64fd012151f3526d7b7f5d7cf8b..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d977318314136ed6fd3aaf5e4f49b1d67f61b4602add115658a36456d19447cb -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt deleted file mode 100644 index 9976b1692773bbc41d3b3660ef1be2b04ad96cb9..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:20080daf89ba5cb236435e9b27c2630308a5e3f744873f6169957044b415db62 -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt deleted file mode 100644 index 8068d55f83e5f5c2dedefe35ed33d719faa49849..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8a1f3398d7478af155f6f73dca3fcee1a0777bb28ed30b9dea398ad1c331607e -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt deleted file mode 100644 index b8b81550926f00006527ae011f22c6dd86b72e4d..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:64b3dd79bbad0452c691fd37d7601a48376d9b0e2be18b904436f946e772d1e0 -size 102173986 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt deleted file mode 100644 index a3f06fb6d863dc4fb64b4d2d56966c7c8c20a5e6..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6e50d2f99e504420bc604dd4c6df50a860ff1796bdc7ca7cd2c42d7a37fa4bec -size 102174050 diff --git a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt deleted file mode 100644 index f9582de9b3a466191c337ab97ed71732d016ec3c..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9fd981eff334555c6940ee28e156a5af9d938f7ff41d9e7fb9d10b8323ea55a8 -size 102174103 diff --git a/2b855b9bc4opt2/global_step70393/layer_01-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_01-model_00-model_states.pt deleted file mode 100644 index 913032e212f7b72d447347c49db7f9f13d2c0495..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_01-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b65878a1dd21682bc4d6e6c4e94f05e91cb484f256d4133a025f0c9fb9ea4286 -size 268043523 diff --git a/2b855b9bc4opt2/global_step70393/layer_03-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_03-model_00-model_states.pt deleted file mode 100644 index 3a473bc80859cde92be0dfab642b9f9b739509ca..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_03-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b181e8398650ab94aeb634b317f696364bbb23af4b924f4e8240587e71fd51b3 -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_04-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_04-model_00-model_states.pt deleted file mode 100644 index 52e3d997665d5ba88b8071dba5063212448e7a74..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_04-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:52b3cb668ddd17f15975adb0643eedb8421d5312f879e571ddf008abebf610b0 -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_05-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_05-model_00-model_states.pt deleted file mode 100644 index 9a540d7a61f7259a73a013a8efdc1be2953e5872..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_05-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d36bc19164e71f9211417c847046f311eb155b3862a6470882065a642ac3052f -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_06-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_06-model_00-model_states.pt deleted file mode 100644 index b93db04c81edbc2881db28933b295ce09d5dd46b..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_06-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a3136618155ea4c4d8415f6d5fb41b5e8caee4f644af2e095aa7dec1df58eddd -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_07-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_07-model_00-model_states.pt deleted file mode 100644 index c9e30f3f74aada8b4c85857e0a166d5276c8f094..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_07-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e87d683ff7f41d4da15c531a484f5ef9abee240eaef31a4f72a74c8598d61dc9 -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_08-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_08-model_00-model_states.pt deleted file mode 100644 index 5d1c532bd83ec380c0b08c89a60c72929a943ea9..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_08-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2a0f330a7506b14587f098edb6c338fff43a7895d5f6340a753015e77891dcf5 -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_09-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_09-model_00-model_states.pt deleted file mode 100644 index 9d7e0ad37f201d0d16d4b3671d59118fdb85555e..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_09-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:79195a8e9ca01fe5590259cc634a5d5194f314c95a555f64adb5f48a4cd4f791 -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_10-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_10-model_00-model_states.pt deleted file mode 100644 index e85e4a67c73a9b9771cf6d253cfbcfa1cb692a6c..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_10-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7c4f00f66693bbc5134aa872ac03ef1c64db80fe1bb300f13e45433d97419644 -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_11-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_11-model_00-model_states.pt deleted file mode 100644 index b46eb85e08ad3fddec55f4c2c6e92e4c622a7f2a..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_11-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5e61fa93d4c13d21946b6561796108695dcf04e6672e5cbb8ccb99690cb0b6e5 -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_12-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_12-model_00-model_states.pt deleted file mode 100644 index 643fb128ce1b5452335e28b5599f17df2ba961de..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_12-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9dc1d5cd8421f5e6a9297a8b4e1cc63ebbb956f5dd340a06ffabf02bfff2912c -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_13-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_13-model_00-model_states.pt deleted file mode 100644 index 232db9de78375a23ba822943ed78ccc8fbc4051d..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_13-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4b5d4738ecba61c2f2085d7dabd4493295965f98b3add0a90a08841a09adf527 -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_14-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_14-model_00-model_states.pt deleted file mode 100644 index f7df9fcfccd8431adb8708ee5befc3e63a85d167..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_14-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ec732fdf47189b990f77b4a1a47ff1193f143cd5fb620d97ed718af0b3934a72 -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_15-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_15-model_00-model_states.pt deleted file mode 100644 index d31a87d7dd76a32993419886fd405d3087060296..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_15-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:14772b4e2fc7991e81a16a495c9bd644bd1c7c8778651ed5239cecb5515dd673 -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_16-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_16-model_00-model_states.pt deleted file mode 100644 index 744c7df6062ea113710627b8a5ea8dfa409f84d4..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_16-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c65e4cf6eccbad43398d5a66fd84875e75954b48869263f0e1cf1b9bf1834f65 -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_17-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_17-model_00-model_states.pt deleted file mode 100644 index 2eb8a8254d2b6c5041ad1faf08a14e2bbfce3270..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_17-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4083f4339901157a7a57f50af55fd0ead6e32dd97be70666a89b6ed6d1078909 -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_18-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_18-model_00-model_states.pt deleted file mode 100644 index b12a119d2a1bf0515d82bb4e4e662f64393e029f..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_18-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f28d53919388c09d7237135914d65f9400209446566c19028ad24af0d4a8ea71 -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_19-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_19-model_00-model_states.pt deleted file mode 100644 index 5cdef194c933ee26fc18f62498753a43dc236582..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_19-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8072d23e5317c61ef3c82e7c8782c3d6baab61ae603427e806b562f6ae0597f7 -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_20-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_20-model_00-model_states.pt deleted file mode 100644 index 6096a35d7521c195225dd2705765cc544184c90e..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_20-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c13489178cd7db6f08b89fe176827f39fdbcf2064afe7a7adaf2036e72c220fa -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_21-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_21-model_00-model_states.pt deleted file mode 100644 index 272542a31c213ebf664291c0d850cbfbed1cdcb3..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_21-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4989887d7042c68086517c15a70a5d514994455a7987ca7c28f45e9e3d3b59c5 -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_22-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_22-model_00-model_states.pt deleted file mode 100644 index 3d004d91e9b51f29d6588f09bf8ee6027ee8ab25..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_22-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6f900afa8e8a99f8fc12cd208c1488d4e48315054020f3bb7ac7ce3ca3090004 -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_23-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_23-model_00-model_states.pt deleted file mode 100644 index 3fbec58d271a76725b4b791b6a9654140a1d1cbe..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_23-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b7507ee0073f30561017aafc550935bf091bfeee84f155f66aabdadec0dd696a -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_24-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_24-model_00-model_states.pt deleted file mode 100644 index 9990900e9cf88685ca620296ccd5cae30232b385..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_24-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:59821056b604e5a826e57c64a852c66120a7b23e2baa1b2f03266a8544061543 -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_25-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_25-model_00-model_states.pt deleted file mode 100644 index 4ad4735360f1f9b9f67a3a347316a55608073692..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_25-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4966986da75217f9ee6902945916f4a4be22e0b361f4ad28e350df1f51391db2 -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_26-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_26-model_00-model_states.pt deleted file mode 100644 index 6ed8f73cd437e71abbf2566952457ac4d8f5a41c..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_26-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:65d78544dbc34456ad267d00fb7011e4acef67e4617ec3c3986688f6ba17554f -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_27-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_27-model_00-model_states.pt deleted file mode 100644 index ce061907d524118d031c72c02a5ba1d0075380b4..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_27-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:641cfabd6dcc2efe1e51554b0b420120edd6b2c414af2ccddf59056344c32a4a -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_28-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_28-model_00-model_states.pt deleted file mode 100644 index 544089771c6df62343543e04adbabaef508a709d..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_28-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:92f33e34dd50a91c926fac76b3728dbcedbc1cc43e3ace93de7edf80a2976bb3 -size 157357315 diff --git a/2b855b9bc4opt2/global_step70393/layer_30-model_00-model_states.pt b/2b855b9bc4opt2/global_step70393/layer_30-model_00-model_states.pt deleted file mode 100644 index b1dca95e521eee29b25e2f141ec52837130cab1c..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/layer_30-model_00-model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:69e2b3881d6bc11adb38be5d646d3f2f1eb3fcbcc31cbf4a5cd9e3ebc28c8dcb -size 11459 diff --git a/2b855b9bc4opt2/global_step70393/mp_rank_00_model_states.pt b/2b855b9bc4opt2/global_step70393/mp_rank_00_model_states.pt deleted file mode 100644 index e6ebe80f92b005c5ff34b68a6fd9d5ccecaf398e..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/global_step70393/mp_rank_00_model_states.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:449de953bea560aa04f7b43160b6178f8476c22c5b67f7e7c5e52065a55027bd -size 43827 diff --git a/2b855b9bc4opt2/latest b/2b855b9bc4opt2/latest deleted file mode 100644 index c83f282b74763fd1dce06b1c61c51b42d6ed9e42..0000000000000000000000000000000000000000 --- a/2b855b9bc4opt2/latest +++ /dev/null @@ -1 +0,0 @@ -global_step70393 \ No newline at end of file diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6d0a5a034ed2ad9292f466e1a227483bb00bd46 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faa982714e04e5173879d7e8907ca1f82bd8bda22ab3541fbebca64843af2ed9 +size 89305623 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d54e663d5839b57a166d0f08b30f7f2e5ad3524 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b5f835ddb51519dc74cf17a0c8b0adf6a13a454f3ed3362f51b7261fe30c9c1 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6971eb008dc154281bfb3d25c4ee38f5a3273be8 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12a0a83e4198056491dc9f390fe0a146c6e9f74a01911f5780ddd8dc733424d2 +size 89305773 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b6828f65f5d30c06d80037e475894a81a995c19 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee501b7625c1351def5566ad8b547da1ef61ff44f42ebe3917e2ca3d84198d74 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70d34fc9202b822d873692ecdafd272ee04ca807 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4facf9909cfafd454afb769cd28e5f11f6f1fee7d905fb337409d35edc0c3a8 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e930159fbc247ac7a52908cc09fd5d295c1e6158 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1b185f72bae9093e5d06dc752907249620fbb0c660d2d4718c1f6cf070141ab +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90d86206aff05a8a6348705fe3697c47dcf4a1f0 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42d340a0d466b46658e6c1c58074125ad6ba2dc75078c279ef7848c4db5fe543 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c9983dbb320e8473c099a6e2f19cc76a52d4a0f --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:477f26b4ea4ab89ae40dee458e5927e1e2ab3e49dd378f6f037463cc74531099 +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddd900c8fe7edb0c61edef90191d0adf2f5d06f3 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b738a315ef272521f5a7552286a28aa3873a34b49cc9a702f3d1bf4bc6901d +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcc5e5142f7e6c9b0c4c2c3cea5294351c8b9fff --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:217c7a1222c45aaaf5bb7ee06d631c898fdb94084616eff3dba48af4611c2bc5 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b91212a7b8c1e4dc50e161ff97e7fcfc323d4b87 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb437d115f5350e1a1d03ef244412a54f02079808b7431b464227a4b58f7cb77 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..106c014f501b1008fb888b51370480572e902b8f --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adf6537f9b0f3e1d13faab510277b43022217244cdd05ff6ce3e2880536f5a6d +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed9dacd71074c4fb9b0bef8ed173529343d9b38e --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ada8c88b95c2ead1a001e5571aa82888dbb0997a4fa88bfda97f821fd8a97f72 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db56915a03ef4a4c305c07e6f93b7c1919815416 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32aac13996654507d50d338cd6839bfb2845455fb366d178d3a6084f32a6559e +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2022e3dee1fd573a05c0c76a479715512f9646af --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b676e5eb8448aad6754e2de0a544cda191d8c2f5d1d5519cdf6e1356ab683d9a +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d9f9f6d593d34fc94a5ff7f505d567ceb09c4bc --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:358b839a65eedf64a2c5cf1939fa0ca6ff83fcaef26c4f360fae9d80eb49f284 +size 89305773 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d887505a2ab6e3fdc489b2bd49b7533573fcd5a --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f300e532f53f6010f8811e93f38511eaa779f66692aa0ef7b6d156b54df58d3 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46b71a736fda324f107a2ee885546c07ed4bebe0 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad47b2b1b2cddf6a7a46c7870f89e99988ec09eb956ee9bffed6651648e7f2a1 +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c9a58720ca6b081ed9c00b67b589901d0eeed8c --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85eb9f57e162b564ee93bf8ff0e7e54d6cbd11498b8336c19a2b831d2e115c57 +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fbddd4406498729a14fe1aa03ca5e0c06ebf688 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2134b5efa561efb8e25a45dae2988a0cbad71a9bf1f17073848b2fda3d74664 +size 89305773 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..daea4e53122300e1b347865c5f7ef1622bb3a932 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfce8f40c119da3f4a3db19b562ef44645e2dc0e725382dda629c1954243a393 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3bcc4438f9b186afd64392dcf76611def352505 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cafac3192e7ec28b9e1c9cbb16f0c1a1676f62cb83601b36e64c45e342da6758 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82c7216af55e573b54bd4edb309525e094f01834 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48b57cbfa2d1e4e9019b0f5aef558e24c0b1e00053570e6a28220f0886bea8d3 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5c804bd8d963cfda03eb721bf93558c703849f4 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b6b96b9ed2abd074e83adb8ef0fa83d11afa4d1c986e35e38641b78bfdc8718 +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8299c356d1600cbb478f9016e7dda09bc65d08f0 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ebfef188ed0e153d6e4ae9739d13bec6675054d9e14d3bb47a460fcb53b773c +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24b423a0abe90f488bfa3ff39bc39867b2b936ba --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d068a4414e726d8cf79bebdda996a1dd4e819467f73f69e2d688306aaad9139 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ed400eb464ae2fffc94eb85f27e5460c5ae08a3 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8e116d13767137bb8977c40b95b59d585db7cbd13fe772aeeebc0c0ea9143a5 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e580fe7618c7d0ec93998bff8fb73795b7188519 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:086a3013c2f19608b5193c2f8e2c3f7d16c2f0ee19819723beca3a0a90cf8205 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fffd661614b863594943d33a7fd94e2699a2fc9 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a446d582db1b2dfda4e2155a229434884ed04ef542e53e84642d63be9a020cdf +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e49b0166f9a202de6c785edd600efbbdd82eff37 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7ad714ca79fe8e3f83afa4772c27572b74d3c01992392d53343e71066447569 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecd6579dff88b5e2eb91a9772cb31879e487f7c5 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24684b3e40033ed67d46da85089a53eb9014b06fafc9f5231493e05f684ec72c +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4dac505df05b237644aa67bcdf6eac591268cc7 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73b9d4928e58024332d18f6c01c793b342f84bc81de7c7755c8e7808f0b107ac +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5dc35c92d823015380fef9a3976335ac2b04868 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23bbcddb4b55bd57a3b6859c6cc0314dcaf59da2c749721cab5d66609c73c247 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9e4ae4207ce022717f4e800fd3e94fd99048964 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31567a5c83be86be4856e312771aecde609ba288d38a6c3f097cf5e8fdf48564 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e916ad54d72cbbf4bb980a7fab44af6b9960ddf --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3469cc56e844878ec3cb2b1961790ff803c15e12cd67d7e3f8bbdb02c6b83ebf +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ce481abc8683e8684db818542d41385d1d5aaad --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:850534ef5644fffa718e451aacaf4321543b1c42b4d7a5db143233aa05741d88 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da623984484826742ec80478c77e0b9e88ec4e06 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:224fbe0f94eb1d3a87671c4d663744149966a31f8e70b913300a636e5f824d98 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfc84c357bd9054b5a90c538e5d269b5d9b34b0f --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f31fa73eb077296d108ac495f08613c70c020a27948c443f69b79aefcf6af28e +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b33a15a80268632d31aeb2d23782484892b6a35a --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f10e69448e1e9603afdb4d4793c4168ee6e4ee63f8a2518e5ade366e0c72a46e +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..088e3c59e0f9268ed21e1cf88c59047274873fa3 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dcf8d97144c5a5b7cca517192dde0592e5e2d632bc2c511f75e3e51623c80b4 +size 89305773 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3132a1cca69bcb83551cb8a6b0c4b6f0766d9d48 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:577173d8652361137b08728d04f1856026d79ef1d2dc9b187a3157ada4be280f +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..823aa95984bfbe9628a59aee4c26069c4b125975 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b1e8ecc4f9cfac56e5a471b483859e797b2dd7951b84578bcb42fade6c23b13 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd293f3c5fe7ce901f44f741f5cd937ae363322d --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:103468c2c541bb702750bd677e7ce1dce94e9fa620f660d5bb25217d86b5b95e +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1d03f4f40214230c4ff0fd10c804de3b9dd1bb8 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fbfc7aee194e50cc3925a349e14c8f33cbb354572625af123b089f730857be1 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4a18f47b00c6a419329064b51343bfc648e634a --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1105a7a4aa85d2dd8fa0faae0c89497717143a02972983651ad2849562f39675 +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8156a650a6af3d5bcc1d36e4b497109739004260 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfdb83d2082dce61d301792ce948124e133b3ca650435d9f10488c2412bbd155 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c26efba873c2953169dfc5b6754001bf637ca515 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:016a621d16a426d8b770fcc8e02e1f18da370268c83caa719c29bb108a6b324e +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bda372b5884e9389bf57dc924d800df1d20a30f2 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6eb910722e2cf80349cfc962ee6fb1aae09c05e9ad97e93ccc08d6ef85ff4bc6 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04cbd6dc8e696a9bb553ba3148c92e3a25f66d72 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00210461940f5e4b72d3074f907c43481ecc190556fccf358d1dd36f25895122 +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93efa02b49fb034672bc7b4edb6500aac6093029 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:425ecb2b8993f16e4653f8877bee23b6a917b2a453f1933cad1f6a7024a2162d +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6299c3e92be1814d15c240fe8aa4a453075e729c --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9f39cf4958082e8deef13add6914ca67e399572a5a0bf04366843b5d8032a73 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dd6ced57b2b47535824aa36d3a9eb250ab36286 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:086955551bf20a1304a9c9d20ce3b995bf3650643b555a419a1fff6453bf3076 +size 89305773 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b1867361e13d5bb89bacc22ac97b72e869ae15e --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5a2423898d41be51e5dea433edebe929055154ab326171c783b6458f3329bac +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0e67d4c5f243ba94551cea763a69bf60b008806 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48a3e5581ed975bffd39297951e54855869bdc011870df67eb526cb511accfb0 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c71af5b4bd810b6a07e2da9f75ec44e61e3ba63 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02852e83868c70f30800dea0349dbe97bfd87672eb9b43b804342cca1e38f276 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea04009a009657bc14ed6d71dceb0a659fe915cd --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e83a8f3ed12593ae3fdcb12a6d4e493610ee371d432d06fa3ad4d9c67c6e5a5 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa2b3f4153810fd1a39e1ee6eefa8cb211b8b3f2 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc620b4fc19c85a365f482708c3bb5215be7f6eceee37fd75a74c51f56c4dfcf +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..914c0731678a99d7879acd73426476550ec461a9 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:969bacc14456b8d6a08f415375f54f07b9f7e157df5435bfd96ded5a344beae0 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b4ee3234afd6849148ecdc7928d59072a49f7f1 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61bceca2c797fe205fb12f5deb639f5bf3f2bb8cf70a2d715410e8048401c0a0 +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..166bed7fc1045127b037a12e69c17d0a62a43a61 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7c154ef803a63274b7cb8d5a2fee9743013776fa4090d89c4bbf418af104afd +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc0cf2faf98df6c4ee87e27e30536b515b1d7e4b --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7727fb351a5dc48558ef9d92bbe4160f81b2caa5053e377ed5412e3f21b4883 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e56fe4742f442face7302710889fce4fdf9992d --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e0571011c16af6c33cdcaf7c93796451a5bc2e7c6f9a9af5b3c3708e0eb8cbb +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6a360ed7cf3459e6b10e73cd5e8afd5cf80dcb6 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:123df0e5d75ade9b2493e63192cb2eae592d5f7d7fd03a8da96bb4aa0bec0222 +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8eee97c7db895d0c8a7c7d8734e67c658464f095 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88b0e57f62a0a27d0976868abb681b5834afb5e4dd6098f04aa9cd2cb045fcd4 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8442b300f13707ed3b463b6871d2c4db0a69f0e3 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b632ee036aef9b46e1fb348857143c901d8d14be7f1b472c1084c43cdec8c12 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4230a29bb3ea65c534b81865521f7b6d7ec91bab --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d967d36fcf8209a8c118d50056a164a770734028d4e6ceed7be25a0267398340 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42bc7196973a941e92599fc992ddc70ad9a77db5 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a85e5f588c55b53dad25f4f495c5ec416df445378d3b73382cf876d52db4524 +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..678db34085abfc6f3c87768f2a75e0fda4c36ad3 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebda9f7f3d62bcbd9bda11b1ab0c4b979f824f4b1349b8ef284bd708b683c618 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20cfb973598d1fd0ad53ddbdb6d1c73124ad215c --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebcb9a886e0a93f68da3cdf7143ae61b1d79f88f94b5dbde29b32d4bbfab2f52 +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c0e97c4c3da985f6578f8b38559c44c8ec342d1 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec0297bd6d5ef3288cf19d36ef55c75139fe037d7fd95053d0c189c9c7006113 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f8c647b9332b1cb6ce172fa58ff102f30ed9fed --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea89615de8f4c23e9f515874229858efc4b69fe9102533b3d1851bb72bac172e +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d77c179ac49117d6367381f378751ce5799277b8 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca70b60c8e41f91eb4a7193ea39100979d12b3a0b1583eb37b7aa19ac953d76e +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2464d02e4d8e1ab2dec3ae5bba6308171c77f7f4 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdffe3fb904e168302a5b2d7e2b2fe3661cbc8af01cb7100417e6255d0ec780a +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d2df913b62d74d32278f285a77059a1ecd54d1e --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd481428794598785383023aafd9088aec7b1644c833049b98693186f9f80ac6 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b4fc9789c9536aa5f99fef0a8f4d6e8b96324e2 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0a7abb7c51f7cfce42b1929340afefc37cbdc0ba35b1755e2e8eda2641c9b44 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a60f498fd5370f950f8d64804bf703f5222dbfc9 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cb536b1e61aed279b9f623da917f87441d083ce4659b78641de005b225ebedd +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a54787ae499cae3e179810e0501b911c24940a8 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b314453187fbec8534a968b704fd77684b1adcc76ce300e1272fedf2213ad1bc +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5bddc0f1e7c0e16a20b8ac928e63e3432db793d --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63e1a0908247d838e401e726587eed26c7a87a066c3492c5b2b25dc470a59c52 +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d712a2637ba038d5b211d2598b7fa622e133f8e0 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3c28d2fb9eaedcd55736085f309c05fae67ae2d5e23f504ac825a8d29e313c9 +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f962118a8c0feebe95dcd340ff38242f7921be3 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf92712c8225c8a88e00dc5c603bc2799994910a36db00de56008071b80266ae +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e9924a87f859f47431d01cca391417b62196436 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaa4aafcab3a9c201a4c35bca28a40f6333d894f0f7c452ff7831adb73c360e1 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c79727f1afc3fb6d2dea903167e2d94ccbdf492f --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf50c8d56656e0fcc1a129f5b0c48ebefacfa4e58c362376584cdebebef16e59 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d85986a33f39e03c8ec8086005ecc6a623ad94d --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5478456746eb86c84199e2a126b3f3aafc5ca1fcc43a763b114c1066f038ff26 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30d1632dd3ab26149477fb7baabccd506d867b05 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9c76035a7eb2e96a6ee130a84784f2c288dbce93a7dcbec20f7a8e50b1fdb3e +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54eaa9733905f46e1a308f667870d105acd461f4 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1f1ede5d2ef283b6c222f187db342a478f1a4edbe168c3e91ff4c2b50995554 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..594a86a41cf7af10c90df6836cb4c407f7e0aa9a --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90e2fcf8e0278649adbeb87ef9556847951335668e6c3bf9d3df6d53a22cda14 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e831cbe762ecb14fa6fdb2cacb9566cf6fd6178f --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b42ac1028d120cf2637c1099f7c62fa9bc623650738b82c17460fe4c9e9f8781 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2a1af550789f85b320f8b3c5f79e0bc05dd59f0 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:156639ab2cce89695cd83152ed31cefa2f1fc3fc71798518dac9326fbdb0546e +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27237ad13b93c77f09c1e6920ef7d5d6133bcdd0 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aec045822f04f8b6f0915c7e2aa1e120304e0961ac2da41e20709777e56b4cab +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccb1150cd881e739caab23880a28c6eda4168cca --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d084ce025796954ccba580b4aa4e46518b8f82a64c442909e985730a933cb3c +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d0071aecbfc42a81671f9f7c0c5a073a1bdd18f --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab6c6fba288418c0228da077b9a34291ac5d815c5f7a98b23f4c4e59b0203931 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9365be9dce57a5a18c4b0a533a3c91f24e19b9f --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5835cd562380a52db40a1e48c432b0937b94c1079343719bb94fca4f7d5340b1 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca77c4de8e1fe1cdc6557019ab4b6ee277e4087a --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0b8acd7a697590ef333985d69575bbb60913fa5bfd8dc269e8ec9ee1a9a7e86 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5067c4404ee3027f9181d0907f22c2a5f2e0a9f --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22e5912850d8574db35214697ba33fbe12308559a3d4cecafbdbe5c316feada3 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03973bc2ea001872bc8740d9424e6ee05472d985 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12eacca0c3f1a80970cfe5fef5884afb804d281f67fed622a3b1b557d3937a80 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8870a6926ad2983519990d4f33e3957b6c27332 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed047356663dae12b9ba8c3a09d83c9713efe32359afb804b4485fc49488160f +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d15f8294aa4f115fb4b6f83d4c3420263c82841 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc515ec59a936a154c59744792fee9d7a1bd72394d01c4d4c53c58aead79ee66 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcf814e51ff72839fdaf2bb1a5668faa2ba98deb --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf9db091269c0764981e496f2c059efc0aecdb5b1dc4236ab11b615664cd26d6 +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43c5c3e6063ff024ea4aa5d3597d9336ab72b51e --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72d6b1cd0e02ca393d023c81d07a451739a22f49080bbeb3e83f617b7c49b698 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ceb6549da6e443f4c871d296abd8fc6402d9d17a --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f086a5039c9be02e6b3a904e958ade7df2c417c3763ba9a7bff015f404d51812 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e44be0727760c8fa0aca7332ce0f12931eeec27 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9033f6c8f530a742ba94bf7dab46c1dcb01572c9ca74071ab1fa1c5c934d910b +size 89305773 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eceb7e21309faa1c1764443746ec6688a835f766 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cd0b96af52d1847a2fd6b5b76c1d811ce3064834ee2ebe7c9cd568a5d079ef4 +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6ab38693feedcc15996f90b674a7d7faaecc4c5 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:894f0856d5b9ec726feab49c4021b98e85ee1dd4f29709f40fc71858ebc6e3f9 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76c5f31b0a3be04294d9c50d35c98078bbf298f8 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87c98898279867fab21c6bf28f9ae091b97dc849dff042197329565d3525fadc +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..462cc4563a2dc008ebc3039c86a561563a51c529 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64119acf51cc336c277d05c0e1f4346b350ee650daa3c86413d09e1c80343466 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d28c8f0ee1d05d4df6fb76697134b96dcfa8dac9 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fdaee2bc2b06d64c41ee2a4c2a1f34a3ac4a86087a4beb6eda581cea9b26db4 +size 89305773 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1452d114b53a75e3681c267a970a0d7f58746bfc --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c02bda7c5ff1de054ad23d01b058ebbff169d64bfe5577c77fae123e0fa67846 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f54c690118df353c985820c75f4fa77bd37092a --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a42bfe46aab3f7ab92b58065f42ee9a54e2f4fbf722deb515e7a1f73e9213887 +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bd9f20e28ab0fe3f44e1d16f0b5e88052d8843c --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61295a7d0c0d7c441440d2fcd4426976750db7a20c75b8a90c32f0cf76b04512 +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17c870e3e8f854d343c73d0bb9a7008d7bfdf92c --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2bcff9ca4f5ec25b0ad3cfa4a4f669f8fd2cf3228d4c936e5b090507c4d257e +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b82bd9ae68be62a6f20b4caefbad8851218aba68 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:823774d6930edb9488f0dc83788a0e50d5b40b804d7187a87d9d3daaebae0cca +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a739d6b36084dcecd9beff732fbaaaaaa2cf0f4 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:826eaca6e317e00aa7f53338331b59b1c1d24e041212d86a2e6aac37467ac385 +size 89305623 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d903722ee2d347ad4ecc5a8fec6cb4b90f7a5406 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:185e91cbc530d0bbdd34c69485259dc834c68e627d5c4ed184f766593c067690 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cee37576dea80131409efeab1b61c7cda199f1c6 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3efff9c8e7dc59a3e4d5f49f9a81eb3785dac2971b8a40f2bcd48c66f7fc010e +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b9391d090c213c62d4f558daa5e9a1a359e9aa3 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcce157e8170119c02b6378d789ffdc1fc6acbad55c0bb491aad4d4b09099635 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b8f2a9ddd48094db5fc0ec7f319277e1048ff8b --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2169642a586b0c5c02ff0028a8654c22cb2c60051ca2841ef096a0b97aedb52e +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..287b6982d17decc4c1316ebd03c20efd5e34fe5a --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06b8a6abb14df9c2cf1d8d67885a389d628bb592159c77487760945a3203a74a +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fee7c95986f8f6fc942c7613a73bf19c4c8ca029 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bbf9ebdbd1b9a989ee5e5fa5482fe5bb3646cbc5c2be2d29a0390b727c7c800 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a2966ae8f7a5f2b3a9fece49e630f988ff7114b --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d598800e8777ec03a6f99877a2ad6b5b9bc6fe9155d3731e6659c102b6736129 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68ec163f5cdcf45e0f02daa7713a613385f03e3a --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34a330d467a7e59411736b13df2b0f922399803496fad4e95d89938449f29ce7 +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e541c6abff04ccb5efa3dd44584f3d58aaea3f8 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0151397f1fc3deb72953c387f0afe2103f796c88014e4fcd2d02666a31f82021 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d860477dac36f9925006eaaf321a20342f2933c --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7578380259026f85bcbff78f108558823a5e13c97f36fb5868d41677eeccddfb +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d2cac2803a9f408a79a65e561defc9b11cc61d7 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5013f347e1a90ac2fadd4cd3ae89adb88b04459cd35a751ae904f1986ce434d6 +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f45b30be27aaf67519b14c95d0e411efd124df3 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ddcb619a47b4a3269366d3f48b4175c1ea71f4bc7d1b41c1de59c42ceb0c22b +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..371dcaee57c8a33e247c37c78ef98163fb7c703c --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbedcc3de69dfa686a1d8c22ba47e29c6c3d1403ba250b56ffba522079fb21f8 +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd5019d4dbbd643e0d3fa1db63c974d266efff32 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2127297aa0d7e937c7d52bd06c323a62a0dcc44dba3d79675099081c53404cec +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1eaf37149b85e28b21f4c83e47723cbdbe6dc9a7 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8ea9df5349e793ac2b07c76aae0f8871a95caa1690d1da79f5cf97c88186d25 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..adf5dce132ae467174a55e8242d766c374b2abe2 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4104999f381a1683141bb138db95b72e2f4a61006f4b820d0e09222000d95a6 +size 89305773 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..006612cfc0aa6cce61f765a12c4b14307afc8612 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a66cc1059726b8ab6efd167c9bcbbf2c0caa392b85c8c5ab80bf434f587fbb0 +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16c1bdc6819f4951797a8bb1fce41b99f461057f --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e363f1ab061a145400ba18802e45596198df5f14038a068a4c04565991c389b +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..faaa5cb32fc0a5448836f8285b6300a5d0194a73 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9c78541a0cef9b65e773a3508db03b534d413c168cb957eae45e6c7d4ba7594 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebd4aeaf005f9cd487d1242be880704c076731e3 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58d5f433f96c86155855fc64e810fdf3da68cdcc4b8e9e7f39b3f3440af3aef5 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c2742adc5db3888013caeec1b0bc0aa133ef178 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f93319f6755575fd597d6e4be6a308916ae5ff77fc55eece6b38f9a33a362b3 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed09742d212e216667360c71978ec1cd573ecfa0 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24d9bc52eb722b67a5c3c2b69598899f442465e622609255d3caf10da1b52e8f +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e22fc91d0e76197f721e0ad796a74ba1f558532 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54178d1c98b64e7467d956a5135d7f818a9c16859be9388b03dbc5492b908637 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6e8a0a7586fbc353558a48bf8630d01e9485c5f --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28ea04e496915a11b4c9fe637b04d57bc801394c2e990761f3131dc2b3204cc1 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c62af4d7279bb0be77240c8a902b5c8096cd2c8e --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a10ac39fc3e171a3f7f35cb72501a86f814a41dd38627f0c9b8295bc03aa18a +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2723c6d4856fa1cd92681a3a99c89ca2a776c07a --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19bb59cd2ae814a76b89162fba2b840af5e73b3df2d1170e7831adb8e3d4ffb6 +size 89305773 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96d28b18af4ca53fb5c91bc222b7b17aa7c1b3e0 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1ea0ae20a0aa871f44ebccf17817ba7e4356656e0f4a1108d72e6e253a5b1d2 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e46da196869686e952ca88a5f62b967d8d268aa0 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:071a9e751ac64da34d21586e26344a53fe871e3809e5884594dbe421f9d9bf6d +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0a57ceb61ffe77b58fee09dcd98f80442943f5f --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b745033745e6866d8e7cb7cbbe63b632b7390b72168d437a78a6b2c2b6d9fd6 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6d0486c202ae6455dfed871debd722bbe2b1e08 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0c94452bfb32d9086bf2a551c79198bc968bfb47607cfe9babda543dcd50db0 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcd834c890e8bccd080dc67b61a518a2a0b672bc --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae04e04dbdca696bef3664e7cb5aea475dd63cf7fec4cf6b196ebe3490df7e70 +size 89305773 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78e35aeeaf7b2f0b24cb24f3b2459713af6d95d5 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfde63d20e06a4c28a6da4aa2b4499e40f3a9c9b064764e69cb7fb0f9349a69e +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1156df6e8ee557616e9d96d2a8b11878f8bb30f9 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1866a4eb40dd3f1f9eb99d321b4d9880e99d77bb05f1a2da8d0965fa3b3b42d4 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e37639e384aa8e0f3018937ad41ed2c6c4d019a --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5389d9305e968655cbd119476a12fe087df0586cdb84bf1c06b0492f7da83bf8 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..744270b00f83cf4b9d27586ce62379003ed7d690 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e957f97951e04df9b1cc9b0d090182a4340ebd2e153118a027ad4d9c8d25c76c +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0faaefd82ebd659469ea6543ada923949694846 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2485f210b3b55fc7bdd9dde10c2876d8f7953e6f25aa2d1289de4b74b9412fe5 +size 89305837 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb5763c08707854cee0b5d195d5ec310614428bb --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbd2793e15af4ec08c1421301b23c90a07c001126223663076c5e1af5f520b4a +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6c818785a06ee0eed33f48246a2c6cd3f0286ec --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3008938a1a6445434e790f83722993ab2db91230d83938440fa7a42d5133624 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9629f175f8a7e25aadcffc01848c0b823f80f4e8 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1d369863020f1617472ac062e3442f7b4fc081b2309315f43a4f969b816b52c +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..031270112d935ca9a25982d3901cd18907ce8b21 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acd4c400e9de3bebb946df7c748da3d37f94302be8a8ac1b6dbfd055b50331f8 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dae61cdbdbd964e86af17a740be779622e0c44eb --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aae547ba4b60906606af26cc5074e26c7c421dcd0884274f72c87d63ae326a46 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b96b66f9cb3627781ac218da33f9a1d2c952108 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fc5924a133ab0ac434ed64678f2f98b6be4fb2d7800c117c0ea13f1181aa5b3 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9f82c304473b5bbfe9b2d8c6481b23f6c85ee70 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da846be0d66886f13dd5e49a0d969aee57e63340be3ef3771580b32130aa6b5d +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2aa7cfdf5a36aae9f2c2e59f1df155aac0a1b744 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7b7fe13ffe96bdc5acb6633a22cc5fff6fb9fd5a5aac0bb7d8a56d7f053189f +size 89305762 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f96caf2ccf63cfa47e08ac196d941395ff68a96 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d31b4032fd752115941e9e60901603beb4b6a29b39c210198983350d4645b04e +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..786ff62b4f4f756efe54f4b31f6478a1bf650507 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a982435e8010dfc8613ed17c0123d2a03475dee173796e9ea69d33c5855acc1 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1766599a23020a3aa14149131529afec36e9c0bc --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e16a7919033f0d83066e41084a5f42d951d56d8dd3dd238a28cf6512baab1883 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9978c1e1b17b2138e80943088a6b0554fc9692e --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d17c35c62115c06364e8c22857abd7def1181c0dc1c3c9c6b4033e1f3e499f7 +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..580e7111a316505e5ab72bc05554a487280541c5 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdf5bad0b509c0f68efd5d19a3bf997bc104d49af8d6fdbc82d23bfcc2d2548d +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68a9081a054f22a6abad3579a4f4e17076e7af89 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a429b07486271dd632b424a5625c6b66e78d674ccc1674e4f8dd4408aeefde7f +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7677a19575d3854deec9b5415daecd0f053ba47 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1382174f470e3816922303e1186d9b52c2fc96245fa3e6da759a861d05ddcb6 +size 89305709 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f5c1e690f7846733ac33d01217b05004c58fed0 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:775ebf011db81ca2c457737ee4ba24f15bca58d6f31902d8d4bf7e748380f299 +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c92da775eecfa45999a031822493f4e3ffc48ed1 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5851a31e4dc32a86de8e866a89d62ec780cd04f761b319e65257a754325185ed +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa9d210cf23160c3834dd860152a779466eadfbb --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67d7f455f17e20b165caa998a756059a008dca8b78d46cd3b87a0b2fa7f1ec2f +size 89305773 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1657314b12208598830045200662fddeb6988117 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db9eaa53970019781ed3335ce62afbad5ed41b39860c5da7e9a646203b266228 +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50dd098fa6189b6b014e7bf9d67b99fc3573dd79 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0704b165387d9b923c3291f40044cad0f9783a506cb2a9780922dca0e516a2d +size 89305773 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2978ae480450a53e83b7b15000f85fbade9a4775 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d105290b3ac5f1cdb0931c8f29e339ce8690f17f8e61cf3c35a8c2643758dd14 +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc634cffe0468643c3c564fe0c8a301bcd83771d --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7a6d52631d2b8e3ed4f8119070c4629dbeb321b60800e37b3baf2c097d27eca +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0398f8a1cf6b263b6570ccb4a8c40f660c33c98 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fda3c948cb5697207f311f4224b332094e0598e159b7150f8c485afed17bf10e +size 89305645 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45d1bf259cb09935a839ce1d87e24679d49efb24 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:359b78d21e1ec5df8c72dfa7eefe0c99f5e33c21e81fe88cde6313a7a824d4c6 +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cade3af46110836fb5ac3937d115cb3fc49a13d --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5435ad327dc8a75c0bf3bd4542755aa46e38b44befae99f06381590f4ead5462 +size 89305581 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8042322f96fd83b75a0d68f44203672579d7ca9c --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:966f42938103326236e2e0dc455905a988bd299aa8966a529ef78eb53ce02c81 +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a443b43bc88da6d3ce39986d1244fe423bbace90 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2284f53e0c2780207bb79e20b256c8302fd7046443e828774e2adb3fd5752544 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..365e400d33b8f802bd14e595649823c4b893bd66 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ce0352a36437961a279bed977d19c16781470a6183699d62c5fece5e11ca41f +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..384e8c78784e4be1a9e9b9111629e2f1fb84d1f5 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b9712cd0c02dcc74c57c366faa274d84c3a3273569f11b0d5e908890300e2dd +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b9a38c5dd58263c64fc4f5708291a5be03b9371 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfa522c877d0e267df5c02b87706f063b094a8c714a8e9c7de9e84a38689f83b +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc35c56d3608661afc405e6989ba81c1f4fa0fb7 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4211fc80d3c9634782135f183e5444f6383426657ebd01cd87c5338a85640033 +size 89305559 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5aec8050dd8507a8ee567eaa6b6a843b136ab02d --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42cba6b620f1918f8e893e2e87620deb08bfae772e39246700b1656586ba09db +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77e78a5155e788b9c4e8b0a9760f3d1cd7d9e7ec --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef90d5637a7f115bb808c0fb39877df66ea8c1fc44c655787ddb119335828caf +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b71cc2dc5da374e01e0cd89ed813f98b68e4eb1 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03d868ac93dc3d2a15ec6c79cf661a00604058f74f26e509e51017752a1aa57d +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42475f6979ac17242da061e8a44e85be8376a397 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ebf0f1df99ff13b484217ea45dc4e937d7d96240555261a0b700c79ddd25583 +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..227f39b4c562da245cb9e8e1084298c2c9d96580 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67780b310d6a356ba29321887b3ab3585b42e5f94c392a5f85ece5f69eb81020 +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6949d06e1be149ab19d43ffe1df074a87d04c540 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16f9365325f794de749fd005a36f95f02897ff4a92038911afe10694e762b295 +size 89305762 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..328e0066c332ff7bd49ba273b9fe399a6ee3952d --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc7ca7de1bb2602de55005e9e3fca7be64fe292f4fd329a0ac24e2cee140027c +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d64b5aa105a6911709fa0366c7dfeaa103c6f62c --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5dc94b23c8af1f4902e17dcb7cff197995813a5575eccc9d9e72907237a9a42 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43510d865a99ce656ab0bf132869d0a5e299662d --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a4644d8b6fde3b09a2df38d0597c250277b067a971cea09f962a90c3df33ac8 +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd5e3ee2dfc9d1a5229ee18c754fc56d8e6ede16 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e13bf2534db3e59a398ba7decf29485295e3ccddec8c97ff2df9175feda7ea43 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fed2bd3720a3b91e90cd7a4f4c59e7a7984d693 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e3da35874441f1d7d155a522062132b9dca91f8fdfbe8abb34b39d4d63e7d32 +size 89305623 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f8e56232ef5238261ff767bedfd827707b14a3a --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72e927f1a6dc7f474a3e9aa1d50d22794d8cb91df695056477c409ad3019d2b9 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fc69b48ee4d03f2a3fa877931a0248d256241a7 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d94a12e7df6691e0372cbb3b8ab9816d5f63454bf7d6001958586283c1041e4 +size 89305762 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54fb67e4eba7a5c82b36273386337090f1014327 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae86fb049f0d14915f9f74becf0865138226b9889616e5647201fd7bd37ad2dc +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0b2b786e536557b2ddbd5115a7c5115c6e3c554 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8c0953ecb99b9f3b9bb11db206383d29b5854ebcdfc0531929f0e228086fd81 +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7617d2b3623e4d92c974ffd4d006b19e85355390 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1fc718aac7a1aeb79fe54cfc6177a9391ae8b257c04db5d576b68dca72a3a12 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..deba4ac80f6532d3caa960e981f48c3a5466e1c1 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1068b9246798184326a7df25fc7ab3385eb98be6b21035776fc52af1db4b554d +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6632d7eb43d901315ba7b4c0d771e28e4634e70 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:239c58b815ea3952bbde891a87932bac0b31f8268f8412f337a4c7aeab1417be +size 89305762 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f112f3df938412e1e0c442fd0e09596c8e52e88b --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5afc9a09663ca2cb6be9d111de8e0e7ab550d546531fb08d9b8442c263f82d7 +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b5880c0e967f7337095e4dc84cff26b87d5dbce --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94e2c42d635fd7ca586313495be7481581124ec1cf514c85c7ea00c312c49848 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..334eecea73fd2387c4183e370008d5f1795844aa --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d222783c42739ed620b886241cb1eae59590f510688d6426f4728d654774cb6b +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5046487824a402d419be22e5f682fbdb6e6c6c31 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b539e746e5652e00929b4d4f540b7a130a1eb712e91c5fe403d6114c7285e5c9 +size 89305687 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02c25bfba606a43cbe05f4b2ea08cc0daa3d1cc8 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57d4953fc4a5910a7792a24a2d6d36256764e1132e663c0af3df224a7d828844 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e80dbbf815b9a8c5173c1d752f6932fbc9cef44f --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70e20c95c7c88ea1dda3559a53e0cda8632b15ab6671949af41cf95232b617de +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e38b4b8b1a1779d92ea9f76efa2219149d4b73a6 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:747121c86fe79d69ee2296ee14bed737f69b1d7cfc06c5d30550105b3ff43c36 +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ca04f15a9e6c76e4b47fc9faeb46e91267b2319 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2724070f1c9d094ff467d8f2fb98f8afb091ef0491f00825d27920fdcef3a15 +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc2839d75fb43c8992386d88c3cbb1c6c280657a --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86b0566e4178f1d065e22f5f714a54d3d5f1f68ab40c61340ecdbe916e3ba3a1 +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b53309bc1fb942fc185583e17bc79fa5612321b --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b84693ebe67ac477b3c8b0ba35638a6f9b424d597a0726501bd9b12840f60528 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..682bce1a5b570c01fb7c112444eeb50e005e475e --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a85287de2ab3459931e11e1d16bf375706a53a3a636c4374c285be2b0a9bbba4 +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5560c693ae000d163d53c87382f2f4db4df3bd9 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c6f8ab32db719d79f675f4002b282d8e332c6a0e47f19c20ac4c2f473751bb9 +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..553533babfba9e32e23f957b2ae6e2154fdaf8ee --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:022431d6a5da3d6dcadf5f9f3d2bd5724e6c7d8699a16f35ec3d6758e8910cb0 +size 89305762 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81f0e0aefaae13140cc596fdaa025686b686e2f0 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89adca5192b17ff726ad7819948e155c32b2f2b12b74d6861b95fd8910cd5d81 +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89d2fc6df49c9c876c068f6afa1bb5979d6adca1 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31516fe3a7fc69bd4d33fdd92e9c699dee07f4ad69655ca747ba51badff699b3 +size 89305687 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d472731254034fa6e5210d2dc151baf80ee4d603 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:574b76e4a6babdcc0fbcb6d6e5e8eae7644be1ce8a02ae5dce1d8cd0d0181480 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2b56c8ae213d16cb231c5f21da61d1e0e635b29 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c189c4685b9f3dcb51fc37dd71a80a1371c086ce797958835288f10c22b677b +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..490606358d65d74091adccbc3e905b9f334196be --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82c7dc74400c80b2de8a54eb9789a066964463d6fe3684905a68d3acd11ad32f +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a975b132efb99b85a05d415c70ca731c365ea9f5 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e217fdba2e79342d079fbfb14f250735f7bd89329f0c79bcd30196adcdf9a2a9 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1998c3fc3768c2731c6c4b06e169c4065b8bc41 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72cb8bd26ed3a95ce5fb0a0ef3293e4c24b47d76a1277070bceabbd5f5559869 +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34443ad7e9f51f7e15f0a469992947fe7ba4f7a9 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69f7ff424ab2992094fc49e72403eb39d69f973eca2160a2e551cde8a36a369a +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62afe8956ad96f693d34d77888a874561a9ce4bb --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c329a55abbd032d649d3272985ee89ddf46cd598cb63d9ca507de3be9681dca2 +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..145e893dd70c74645f60472b008515b76a6cde07 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9386c4bf07e86a4a417bac69ccbc2f0d7d150ffcb67082ff8bc568002a79f084 +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96257a2aa58c949be91f028e37d7fed9e46fd786 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c24136c68bf8e3eabb4601b6192dacbeb5e80bf8df13b5cc8e5474a44a6b5292 +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56405e33d50ce4b11ed03ebec1bddb0b6ea7d555 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef83d5570bae4c849000ec682bb8abf6ad139a5692c5cc522bf678c7725e8500 +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dc05563925fef8dd083f354186faf33f354fdab --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbe37acc1d237c6053dd017a44c43571d8041c784a83d59f944a9725f2015fad +size 89305559 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..580a239c1d4d559eb3e3a16b3c62fa650dbbeaa1 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:308d401bfba9ca7051ed5479c31af7a5e94306c245f54b8f599c01e45f2418ea +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..225cd25f81e64586af1a4c6ddbe98fa6c16319bc --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78b9f9122eb59022263ceb2a91779bcbc814c03772fe68f316a3758bc428c071 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5b507298193065388336d7e1da736684093242f --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c39cee571508109f7a961155a1a5751961393040a5bbf4adaccfe59ebf8d97d +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cee693367a1683e35154c34f68b7d9648483af08 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2af13b821c0def39aca681950687ceea308e997d7ab71f219347cc5584ddbfd6 +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfc6839c5712db29d8e5b6af1fcda4c3c7afb666 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e89372c2395cc3738f662ccd661299aa6e32c6f34c0cee48a3e97695adb0ac2 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2412216b965dab7600091219fad7364edbe6118f --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:491b39a90cab8543731627af5c4489d34587b7bfda20db2b33dbc1c59da5848d +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56dcfca98d0f061453b4af7927ab07cd5a385314 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df35e9c76cb0f4a9dbd7a543ed8d6cf2dba48e813cd6cb5715680bc03e14bc8d +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fb3ee87d5398c64cf95bc1981f530098043d428 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d5e6b9d5a1c987c8c2557a86f3d84d38fbdcc6d6f7459b0897ad4a35d4cea06 +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90812d8133baad9b93fa62079ad4108866144a7c --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aacdb9557bc7d375ffcbac2765f0aaa3493a08bf28665b0cfb4ffd59481116d +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dad2a2394eb73d88b62978e0433df0ac34798982 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bd9f76e3d55a0e945bf41a3d4e2cc953a7f61a32d66b6f61272e699145f6b35 +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af503c25311e53a05022a82bd17fa1250a566954 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eef9f357f4329a1f0e08423484d06922955977a68e490c8c0af8caf3fefd1d84 +size 89305559 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de1ce5e0fa5898114385053c6b75378507925085 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a876daa59f7f4a9b120841b2ba73175a1239b027af7f7b714cf90f35eed35647 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c94477e3b1e1013095a16df45bb49ac350084d5b --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df23bd191640698bb29fbe6745bb5e51aeba230af6dce199d9aa72ec727f92c1 +size 89305762 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09f9c8845261385b1495d81a4f8e2c461f928f0d --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f167b9483604bb223f35f7faf738c3dd7902a85a7e89d0ae13bc0b563a808f9d +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fe023278e2d900823702c7f3f4bf2c2e9af3f67 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:232fdbe4ae9e04ff5d2d2cb190114b57540e05518908145d595a981f1eb73139 +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..354f6ca5663892ff22e832420b303c1669795e17 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:738517dc275ce528c7aff0081de4dfab1ade25e319f388934522c93c6820d024 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..adaa4125d029539c7f13862d38bbb890e068a905 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5854831ec5d2bd01aa3dea43ce0c24ef4326fcd55f2b5189e147a0e828e90e92 +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddec5e5b6508612160367e6fc75e77eee92a03d6 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c5b4b5a07793f1eb517b1805d37caddf81a059da6558d9c28e0e61664583c26 +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5dbb4c465111bc1a779b446cc5f732372740f8c --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb1fc829ee6c07e5c284fdd301f4d8149a825c4392883a2d6f6ce61755a70ad2 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf76eb44e3107270d570571039873c75b74eb837 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70633538228c4a7c96c64adceb11cfa56bcb6f4d5ae1c5e489be082d7cb22aa7 +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ac51afa5ac2decf55133be04c2df17294169fd3 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27694e88251abc513b5490ad30907a298813648cf2a86d30b01a3122a614345c +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..569d9faf2f32898e201b6d678652f3c46268303e --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a6fef7c09606e541810258819a4e0fb32b36c31b885fb1f24107e642ee90a33 +size 89305623 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2b7692c0e35e0106ed35f04e76f69f72e3a1613 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4606e072994c98399ef1cab4652d9f06488aec2ffa595a86d16841a042d157c +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f9fc2b2c7681de14b0d19fe1c42bc19be0bc1cb --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0860f063b214cae505ec54566569a228b81cd0eb8fcb293d261951da4497e9b2 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84142e77272a687d298f76970758fb01ee10586e --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15a0424c2648b6610e4fe04912528cad67850d651c03a25bef7f952aefbe1df3 +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d54547a7a57035e1cbdab5f7599e856567d07c2e --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5033e559a57bcf39d744a2854058454774071323154edc39d6c1adeb77d68fa7 +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8228178a67ebb4da6ab1a78b512265a7972108d6 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:421c910f86264a273baa6643a8f96d6938c971f523d823877b526a531566ea6f +size 89305634 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e55905ca1a3fa3847e01963043a6e1904d02f44 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e3081a72c37c5a0d100be6acd616c1566488b7bff1eebcab8944240d87298c8 +size 89305762 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e30520845b9b110b8859f25fb12064aa22c6fb48 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eaba0125e4370375600fe66d8c7dc0b118d05108654fcf1ea631976644d8127 +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31017edc270569e08fbf346b27d152deb2994fb3 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75a941daed2a2b7b17cdeb689b406c443dbfabf6270aa36c073013a3df1682e3 +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e669bdb49f2cc0b15a84250d3b4947799c3a0318 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4ba962255d3bb5436706eab7cadad1953e347eaa4028dad9c1e9998df8bcbc0 +size 89305570 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a3aed3622658580b9e21759820d2c3107fa17b6 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ee89e2dfcc23ea60ec58981cc1dfb0fc94d22861b6119c4c96e3bbb38f9d94e +size 89305698 diff --git a/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2758f6341443a5793d0d07a34ede85c9d7cc1ad --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3471931cdefb12e0a94631600a3655be2da64562730d81809e7aa96f091837c0 +size 89305687 diff --git a/2b855b9bc4subopt/global_step70393/layer_01-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..afffaa1bdfee039f6a29c4cb47baebb3745fbb3e --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ceb7561e97daf4dfc1c57cbaee9603e3e350a948595a2b157a8c56e5d19d19dc +size 241239299 diff --git a/2b855b9bc4subopt/global_step70393/layer_03-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cffb6914285e86e3678a12b836bff2093380200d --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f4205a17fe5029e2e80706991a2d418aacf8e597f64073be9a482da12e9313f +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_04-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bedddc877647b46dd18dbbfc1a71385d068658bf --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7697fd50cddef42b4bdfcd2db9b52075dc6278155ae925ec8e8eff72281caf09 +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_05-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..648fb0d81d035f07f3d35d746c300100c7cbcc5f --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2420e48edf2c9938b19028b6209fe72cb8caa57646f1681c0420d8d685424f0 +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_06-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02bcbdb6d61eac793883a6df4ea5bb30f51de1ab --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:731237d4ea735ba05d62a1263bac8eb134a38e3efb25fbb22363b41bd026c0b1 +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_07-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8766abb39c670160cb51411314f57123323c0b4a --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04235917a2a905bbd10e1e9416bea4776e7281dad4bfcefd2c7975019af4b018 +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_08-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5979b5c513ff1e652f32e07e1706dcc475085519 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a54d536e8dc409e071b83b0ccdb18914b680ddde030e0687ea36e512a463dbb +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_09-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bb14bc335046b2b6759433543f0beb6a4351996 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ea0808fe68dd8e50859d151731bd0e13def2867929fc03fef93b4a9efceb11a +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_10-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3fb6595b9be6a4a231602995d3c90cf4098ceaf --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79601a3b6299658a1aa76da1ad2136fcdeec608207b82a7380117633c6482b1b +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_11-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c9545ff2b8941f9ee698489fb7d9a76148526fb --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08baffe7c63d9c9f31b62ce3862fc6b01ac8a8ccccf060c08bfa43b34e6c34d8 +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_12-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb344f7c66f41e2561ebe639055152ea87a63399 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b633e02b32f1052a0ce34446f7346020f388008a867698685e2f6bcfab51c173 +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_13-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39b80e11a5796afcd7813c9b1f4dae4d4a4d5e09 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40040e5f4eedfd6ac917e719ff0f90aee27268833386d69f42f05d0b3c35ed69 +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_14-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c6cd50de246389ce2dd995d17c74afbccfc5750 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e752eda487841f592832ed558db9fddfc167850f6f8c4f1c448cc41c3fa626a +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_15-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c9403b898453af906efa9fd17779ed044cc9c33 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eda59a0207e9909aa63ee819b281347df6c5a38d6d7ad200c45ea33bdd01a1bc +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_16-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f73958f3e8240fc85162a7023e2ef3414c37449b --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:134f26f3dbc82e569c670174717bc1206a0cbea8c04b0d888ea515a080e47cc1 +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_17-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b5a1de23fb947cc42b72fe48f3596d2d31a63e6 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6879f017c1c4011eac69a9a0b334cbc5158267c67028cba80a4c5c9511e2da16 +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_18-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b19860b8995ad16121d0991e86bfa805bfcc02f --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d91ab4365caad4868cc78296bf37f6d4d2e937b1a26af311297e854b6ce04b4 +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_19-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..810c1532be61ba45e5f5ea605b1d73f1c6ec4f54 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17c2d0a517bc1543f4b4ce73391bcd036f44daf20a5e9698160901ddda29ce1b +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_20-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83acf6ae8ed8176787296a7d35e13b9c8b3bfe5c --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:370692724712e0347b20f6e001fa67f1085c90a663a35c91d7faa4618baa7240 +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_21-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28b9318dfe37b45e16e38801b459d66b661c1d46 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a4314462218d301297814684c7a520783268dc1f7b7ca7c77b427289b6cc48d +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_22-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..399d9a2beb961cc5b4b579bcf90bd832ad8ca65a --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9e20b04c41b97283e69d65d8cea3947866c93dcf1872f6e2cf2daf4d2b984f1 +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_23-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca8d1750f1ed57394ba2c2d43502c64aa6d81432 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:220431ec42e0bccb66426a52629a34c0a726dfd44959cac9a37826b371b2ba8f +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_24-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b50d983e8f6c6068a132d14fe6b233c8246e6d0a --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7fdeedc73174b20030a84406823a4e727427bce22f8c044e1e12c62fe9b9350 +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_25-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02dd2d87498b75422cd802bd66367449db467af5 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2be20b7e05b1d7b2f5f3901df724fefaec814c78871d9c778a96c47814727977 +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_26-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..314f7af4fb0549a1b14ce9f28dda7557e7a9f4e1 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00eb89ce9ecaaf423253f920267742b843e2249f84997fc40f29cb120985f04d +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_27-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbcfa7f23a873a5b719c6479d1bce197d43a8fbe --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aad061857ccce5729f467306255f73aa50c3a7fcf3b800d3c62906adaa1f9d9 +size 127466243 diff --git a/2b855b9bc4subopt/global_step70393/layer_28-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6ac5a98fd970c695c01c76846788bbf02fcf100 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edba7e68edcd80b14f75eb3fad39391f89e46107ee4e7def84a3e24d2c9baac6 +size 127466243 diff --git a/2b855b9bc4opt/global_step70393/layer_29-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_29-model_00-model_states.pt similarity index 100% rename from 2b855b9bc4opt/global_step70393/layer_29-model_00-model_states.pt rename to 2b855b9bc4subopt/global_step70393/layer_29-model_00-model_states.pt diff --git a/2b855b9bc4subopt/global_step70393/layer_30-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6377fd21ce328f6213a99f0e84862ad502afd2e6 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0f0d2bbd1c0fc90082187a5b8edb29d5bb58724ab3c43ab217630ff22a06b14 +size 127466243 diff --git a/2b855b9bc4opt/global_step70393/layer_32-model_00-model_states.pt b/2b855b9bc4subopt/global_step70393/layer_32-model_00-model_states.pt similarity index 100% rename from 2b855b9bc4opt/global_step70393/layer_32-model_00-model_states.pt rename to 2b855b9bc4subopt/global_step70393/layer_32-model_00-model_states.pt diff --git a/2b855b9bc4subopt/global_step70393/mp_rank_00_model_states.pt b/2b855b9bc4subopt/global_step70393/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f4492e05d6be655650b9fcede3539e4fb1a15d8 --- /dev/null +++ b/2b855b9bc4subopt/global_step70393/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98c52549bac982cbbbb3f73bafca0a98bf901a09a23104e89098b83268799d1e +size 45363 diff --git a/2b855b9bc4subopt/latest b/2b855b9bc4subopt/latest new file mode 100644 index 0000000000000000000000000000000000000000..125e9347a49ef6c31c1e274272e3ee0c7333db28 --- /dev/null +++ b/2b855b9bc4subopt/latest @@ -0,0 +1 @@ +global_step70393 diff --git a/2b855b9bc4opt/sbatch_2b855b9bc4opt.sh b/2b855b9bc4subopt/sbatch_2b855b9bc4opt.sh similarity index 100% rename from 2b855b9bc4opt/sbatch_2b855b9bc4opt.sh rename to 2b855b9bc4subopt/sbatch_2b855b9bc4opt.sh diff --git a/2b855b9bc4opt/sbatch_2b855b9bc4optval.sh b/2b855b9bc4subopt/sbatch_2b855b9bc4optval.sh similarity index 100% rename from 2b855b9bc4opt/sbatch_2b855b9bc4optval.sh rename to 2b855b9bc4subopt/sbatch_2b855b9bc4optval.sh diff --git a/2b855b9bc4opt/tensorboard_2b855b9bc4opt/events.out.tfevents.1683212808.nid006360.93395.0 b/2b855b9bc4subopt/tensorboard_2b855b9bc4opt/events.out.tfevents.1683212808.nid006360.93395.0 similarity index 100% rename from 2b855b9bc4opt/tensorboard_2b855b9bc4opt/events.out.tfevents.1683212808.nid006360.93395.0 rename to 2b855b9bc4subopt/tensorboard_2b855b9bc4opt/events.out.tfevents.1683212808.nid006360.93395.0 diff --git a/2b855b9bc4opt/tensorboard_2b855b9bc4optval/events.out.tfevents.1683353640.nid007164.40266.0 b/2b855b9bc4subopt/tensorboard_2b855b9bc4optval/events.out.tfevents.1683353640.nid007164.40266.0 similarity index 100% rename from 2b855b9bc4opt/tensorboard_2b855b9bc4optval/events.out.tfevents.1683353640.nid007164.40266.0 rename to 2b855b9bc4subopt/tensorboard_2b855b9bc4optval/events.out.tfevents.1683353640.nid007164.40266.0 diff --git a/2b855b9bc4opt/tensorboard_2b855b9bc4optval/events.out.tfevents.1683354122.nid007164.48318.0 b/2b855b9bc4subopt/tensorboard_2b855b9bc4optval/events.out.tfevents.1683354122.nid007164.48318.0 similarity index 100% rename from 2b855b9bc4opt/tensorboard_2b855b9bc4optval/events.out.tfevents.1683354122.nid007164.48318.0 rename to 2b855b9bc4subopt/tensorboard_2b855b9bc4optval/events.out.tfevents.1683354122.nid007164.48318.0 diff --git a/2b855b9bc4opt/tensorboard_2b855b9boptval/events.out.tfevents.1683353043.nid007164.30549.0 b/2b855b9bc4subopt/tensorboard_2b855b9boptval/events.out.tfevents.1683353043.nid007164.30549.0 similarity index 100% rename from 2b855b9bc4opt/tensorboard_2b855b9boptval/events.out.tfevents.1683353043.nid007164.30549.0 rename to 2b855b9bc4subopt/tensorboard_2b855b9boptval/events.out.tfevents.1683353043.nid007164.30549.0 diff --git a/evaluation_small/2b855b11bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.csv b/evaluation_old/2b855b11bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.csv similarity index 100% rename from evaluation_small/2b855b11bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.csv rename to evaluation_old/2b855b11bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.csv diff --git a/evaluation_small/2b855b11bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.json b/evaluation_old/2b855b11bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.json similarity index 100% rename from evaluation_small/2b855b11bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.json rename to evaluation_old/2b855b11bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.json diff --git a/evaluation_small/2b855b14bc4-results_lm-eval_global_step52452_2022-12-23-23-30-13.csv b/evaluation_old/2b855b14bc4-results_lm-eval_global_step52452_2022-12-23-23-30-13.csv similarity index 100% rename from evaluation_small/2b855b14bc4-results_lm-eval_global_step52452_2022-12-23-23-30-13.csv rename to evaluation_old/2b855b14bc4-results_lm-eval_global_step52452_2022-12-23-23-30-13.csv diff --git a/evaluation_small/2b855b14bc4-results_lm-eval_global_step52452_2022-12-23-23-30-13.json b/evaluation_old/2b855b14bc4-results_lm-eval_global_step52452_2022-12-23-23-30-13.json similarity index 100% rename from evaluation_small/2b855b14bc4-results_lm-eval_global_step52452_2022-12-23-23-30-13.json rename to evaluation_old/2b855b14bc4-results_lm-eval_global_step52452_2022-12-23-23-30-13.json diff --git a/evaluation_small/2b855b18bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.csv b/evaluation_old/2b855b18bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.csv similarity index 100% rename from evaluation_small/2b855b18bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.csv rename to evaluation_old/2b855b18bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.csv diff --git a/evaluation_small/2b855b18bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.json b/evaluation_old/2b855b18bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.json similarity index 100% rename from evaluation_small/2b855b18bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.json rename to evaluation_old/2b855b18bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.json diff --git a/evaluation_small/2b855b28bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.csv b/evaluation_old/2b855b28bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.csv similarity index 100% rename from evaluation_small/2b855b28bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.csv rename to evaluation_old/2b855b28bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.csv diff --git a/evaluation_small/2b855b28bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.json b/evaluation_old/2b855b28bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.json similarity index 100% rename from evaluation_small/2b855b28bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.json rename to evaluation_old/2b855b28bc4-results_lm-eval_global_step52452_2022-12-23-13-35-31.json diff --git a/evaluation_small/2b855b9bc4-results_lm-eval_global_step52452_2022-12-23-23-13-03.csv b/evaluation_old/2b855b9bc4-results_lm-eval_global_step52452_2022-12-23-23-13-03.csv similarity index 100% rename from evaluation_small/2b855b9bc4-results_lm-eval_global_step52452_2022-12-23-23-13-03.csv rename to evaluation_old/2b855b9bc4-results_lm-eval_global_step52452_2022-12-23-23-13-03.csv diff --git a/evaluation_small/2b855b9bc4-results_lm-eval_global_step52452_2022-12-23-23-13-03.json b/evaluation_old/2b855b9bc4-results_lm-eval_global_step52452_2022-12-23-23-13-03.json similarity index 100% rename from evaluation_small/2b855b9bc4-results_lm-eval_global_step52452_2022-12-23-23-13-03.json rename to evaluation_old/2b855b9bc4-results_lm-eval_global_step52452_2022-12-23-23-13-03.json